In [1]:
from classy import *
Version: 0.0.15
In [2]:
# Load the sequence dataset from the Excel workbook. `bio` is not imported by
# name; it is only in scope through the `from classy import *` cell above.
sequence_data = bio.load_sequences('data/small sequence dataset.xlsx')
Target Column Found
Sequences
88 sequences of median length 288
Unique letters: [ 'MRKFNKPLLALLIGSTLCSAAQAAAPGKPTIAWGNTKFAIVEVDQAATAYNNLVKVKNAADVSVSWNLWNGDAGTTAKILLNGKEAWSGPSTGSSGTANFKVNKGGRYQMQVALCNADGCTASDATEIVVADTDGSHLAPLKEPLLEKNKPYKQNSGKVVGSYFVEWGVYGRNFTVDKIPAQNLTHLLYGFIPICGGNGINDSLKEIEGSFQALQRSCQGREDFKVSIHDPFAALQKAQKGVTAWDDPYKGNFGQLMALKQAHPDLKILPSIGGWTLSDPFFFMGDKVKRDRFVGSVKEFLQTWKFFDGVDIDWEFPGGKGANPNLGSPQDGETYVLLMKELRAMLDQLSAETGRKYELTSAISAGKDKIDKVAYNVAQNSMDHIFLMSYDFYGPFDLKNLGHQTALNAPAWKPDTAYTTVNGVNALLAQGVKPGKVVVGTAMYGRGWTGVNGYQNNIPFTGTATGPVKGTWKNGIVDYRQIAGQFMSGEWQYTYDATAEAPYVFKPSTGDLITFDDARSVQAKGKYVLDKQLGGLFSWEIDADNGDILNSMNASLGNSAGVQMSTRKAVIGYYFIPTNQINNYTETDTSVVPFPVSNITPAKAKQLTHINFSFLDINSNLECAWDPATNDAKARDVVNRLTALKAHNPSLRIMFSIGGWYYSNDLGVSHANYVNAVKTPAARTKFAQSCVRIMKDYGFDGVDIDWEYPQAAEVDGFIAALQEIRTLLNQQTIADGRQALPYQLTIAGAGGAFFLSRYYSKLAQIVAPLDYINLMTYDLAGPWEKITNHQAALFGDAAGPTFYNALREANLGWSWEELTRAFPSPFSLTVDAAVQQHLMMEGVPSAKIVMGVPFYGRAFKGVSGGNGGQYSSHSTPGEDPYPNADYWLVGCDECVRDKDPRIASYRQLEQMLQGNYGYQRLWNDKTKTPYLYHAQNGLFVTYDDAESFKYKAKYIKQQQLGGVMFWHLGQDNRNGDLLAALDRYFNAADYDDSQLDMGTGLRYTGVGPGNLPIMTAPAYVPGTTYAQGALVSYQGYVWQTKWGYITSAPGSDSAWLKVGRLAMLSFVKKSIALVAALQAVTALATPISSEAGVEKRGSGFANAVYFTNWGIYGRNFQPADLPASEITHVLYSFMNVRADGTIFSGDTYADYEKHYAGDSWNDVGTNAYGCVKQLYLLKKQNRNMKVMLSIGGWTWSTNFPAAASSAATRKTFAQSAVGFMKDWGFDGIDIDWEYPADATQAQNMVLLLQAVRSELDSYAAQYAKGHHFLLSIAAPAGPDNYNKLKFAELGKVLDYINLMAYDYAGSWSNYTGHDANIYANPQNPNATPYNTDDAVQAYINGGVPANKIVLGMPIYGRSFQQTEGIGKPYNGIGSGSWENGIWDYKALPKAGATVKCDDTAKGCYSYDPSTKELISFDTPAMISTKVSWLKGKGLGGTMFWEASASKKGSDSLISTSHQGLGSQDSTQNYLDYPNSKYDNIKKGMNMILNLIILLAISIVASASNIAAYWGQNAGGDQQTLGDYCSSSPASIIILSFLDGFPNLSLNFANQCSGTFSSGLAHCSQIGSDIKSCQQQGKTILLSLGGATGNYGFSSDSEAVQFAGTLWNKFGGGKDSERPFDDAIVDGFDFDIENKDQTGYAALATQLRKYFSTGTKSYYLSAAPQCPYPDESVGDLMSQVDLDFAFIQFYNNYCSLNQQFNWNSWSNYARGKSIKLYLGLPGSSSSAGSGFVGLSTVQRVVASIKGDSSFGGISIWDISSAENGGYLNQLYQALSGSGSPAAPSNSYQPNTPLTRTYGGSTATASAYISVGFTAGATHGSTTTNDLLAWIDSLFGSSQSSVQQYATPVQSVTATPQPVAATTTSAPKPTASAFNWFGWFDGTTTSTTLQTVYSTVPADQTVYVTLTTTVGSQMLQSLFDKRDVIAEAKSTNLQICWLLFIPLLALICSMAKRTQAILLLLLAISLIMSSSHVDGGGIAIYWG
QNGNEGTLTQTCSTRKYSYVNIAFLNKFGNGQTPQINLAGHCNPAAGGCTIVSNGIRSCQIQGIKVMLSLGGGIGSYTLASQADAKNVADYLWNNFLGGKSSSRPLGDAVLDGIDFDIEHGSTLYWDDLARYLSAYSKQGKKVYLTAAPQCPFPDRYLGTALNTGLFDYVWVQFYNNPPCQYSSGNINNIINSWNRWTTSINAGKIFLGLPAAPEAAGSGYVPPDVLISRILPEIKKSPKYGGVMLWSKFYDDKNGYSSSILDSVLFLHSEECMTVLMTKLILLTGLVLILNLQLGSAYQLTCYFTNWAQYRPGLGRFMPDNIDPCLCTHLIYAFAGRQNNEITTIEWNDVTLYQAFNGLKNKNSQLKTLLAIGGWNFGTAPFTAMVSTPENRQTFITSVIKFLRQYEFDGLDFDWEYPGSRGSPPQDKHLFTVLVQEMREAFEQEAKQINKPRLMVTAAVAAGISNIQSGYEIPQLSQYLDYIHVMTYDLHGSWEGYTGENSPLYKYPTDTGSNAYLNVDYVMNYWKDNGAPAEKLIVGFPTYGHNFILSNPSNTGIGAPTSGAGPAGPYAKESGIWAYYEICTFLKNGATQGWDAPQEVPYAYQGNVWVGYDNIKSFDIKAQWLKHNKFGGAMVWAIDLDDFTGTFCNQGKFPLISTLKKALGLQSASCTAPAQPIEPITAAPSGSGNGSGSSSSGGSSGGSGFCAVRANGLYPVANNRNAFWHCVNGVTYQQNCQAGLVFDTSCDCCNWAMKKFINQFSASLKNNILVFLAFPFVWTSCARDNPLSSENSNISPNAAARAAVTGTTKANIKLFSFTEVNDTNPLNNLNFTLKNSGKPLVDMVVLFSANINYDAANDKVFVSNNPNVQHLLTNRAKYLKPLQDKGIKVILSILGNHDRSGIANLSTARAKAFAQELKNTCDLYNLDGVFFDDEYSAYQTPPPSGFVTPSNNAAARLAYETKQAMPNKLVTVYVYSRTSSFPTAVDGVNAGSYVDYAIHDYGGSYDLATNYPGLAKSGMVMSSQEFNQGRYATAQALRNIVTKGYGGHMIFAMDPNRSNFTSGQLPALKLIAKELYGDELVYSNTPYSKDWMKLNIFTKSMIGMGLVCSALPALAMEAWNNQQGGNKYQVIFDGKIYENAWWVSSTNCPGKAKANDATNPWRLKRTATAAEISQFGNTLSCEKSGSSSSSNSNTPASNTPANGGSATPAQGTVPSNSSVVAWNKQQGGQTWYVVFNGAVYKNAWWVASSNCPGDAKSNDASNPWRYVRAATATEISETSNPQSCTSAPQPSPDVKPAPDVKPAPDVQPAPADKSNDNYAVVAWKGQEGSSTWYVIYNGGIYKNAWWVGAANCPGDAKENDASNPWRYVRAATATEISQYGNPGSCSVKPDNNGGAVTPVDPTPETPVTPTPDNSEPSTPADSVNDYSLQAWSGQEGSEIYHVIFNGNVYKNAWWVGSKDCPRGTSAENSNNPWRLERTATAAELSQYGNPTTCEIDNGGVIVADGFQASKAYSADSIVDYNDAHYKTSVDQDAWGFVPGGDNPWKKYEPAKAWSASTVYVKGDRVVVDGQAYEALFWTQSDNPALVANQNATGSNSRPWKPLGKAQSYSNEELNNAPQFNPETLYASDTLIRFNGVNYISQSKVQKVSPSDSNPWRVFVDWTGTKERVGTPKKAWPKHVYAPYVDFTLNTIPDLAALAKNHNVNHFTLAFVVSKDANTCLPTWGTAYGMQNYAQYSKIKALREAGGDVMLSIGGANNAPLAASCKNVDDLMQHYYDIVDNLNLKVLDFDIEGTWVADQASIERRNLAVKKVQDKWKSEGKDIAIWYTLPILPTGLTPEGMNVLSDAKAKGVELAGVNVMTMDYGNAICQSANTEGQNIHGKCATSAIANLHSQLKGLHPNKSDAEIDAMMGTTPMVGVNDVQGEVFYLSDARLVMQDAQKRNLGMVGIWSIARDLPGGTNLSPEFHGLTKEQAPKYAFSEIFAPFTKQMSTPRAAASLA
KKAALVALAVLAAALATAARAEQCGAQAGGARCPNCLCCSRWGWCGTTSDFCGDGCQSQCSGCGPTPTPTPPSPSDGVGSIVPRDLFERLLLHRNDGACPARGFYTYEAFLAAAAAFPAFGGTGNTETRKREVAAFLGQTSHETTGGWPTAPDGPFSWGYCFKQEQNPPSDYCQPSPEWPCAPGRKYYGRGPIQLSFNFNYGPAGRAIGVDLLSNPDLVATDATVSFKTALWFWMTPQGNKPSSHDVITGRWAPSPADAAAGRAPGYGVITNIVNGGLECGHGPDDRVANRIGFYQRYCGAFGIGTGGNLDCYNQRPFNSGSSVGLAEQMPPQKENHRTLNKMKTNLFLFLIFSLLLSLSSAEQCGRQAGGALCPNGLCCSEFGWCGNTEPYCKQPGCQSQCTPGGTPPGPTGDLSGIISSSQFDDMLKHRNDAACPARGFYTYNAFITAAKSFPGFGTTGDTATRKKEVAAFFGQTSHETTGGWATAPDGPYSWGYCFKQEQNPASDYCEPSATWPCASGKRYYGRGPMQLSWNYNYGLCGRAIGVDLLNNPDLVANDAVIAFKAAIWFWMTAQPPKPSCHAVIAGQWQPSDADRAAGRLPGYGVITNIINGGLECGRGQDGRVADRIGFYQRYCNIFGVNPGGNLDCYNQRSFVNGLLEAAIMRLCKFTALSSLLFSLLLLSASAEQCGSQAGGARCPSGLCCSKFGWCGNTNDYCGPGNCQSQCPGGPTPTPPTPPGGGDLGSIISSSMFDQMLKHRNDNACQGKGFYSYNAFINAARSFPGFGTSGDTTARKREIAAFFAQTSHETTGGWATAPDGPYAWGYCWLREQGSPGDYCTPSGQWPCAPGRKYFGRGPIQISHNYNYGPCGRAIGVDLLNNPDLVATDPVISFKSALWFWMTPQSPKPSCHDVIIGRWQPSAGDRAANRLPGFGVITNIINGGLECGRGTDSRVQDRIGFYRRYCSILGVSPGDNLDCGNQRSFGNGLLVDTMMRSLAVVVAVVATVAMAIGTARGSVSSIVSRAQFDRMLLHRNDGACQAKGFYTYDAFVAAAAAFPGFGTTGSADAQKREVAAFLAQTSHETTGGWATAPDGAFAWGYCFKQERGASSDYCTPSAQWPCAPGKRYYGRGPIQLSHNYNYGPAGRAIGVDLLANPDLVATDATVGFKTAIWFWMTAQPPKPSSHAVIAGQWSPSGADRAAGRVPGFGVITNIINGGIECGHGQDSRVADRIGFYKRYCDILGVGYGNNLDCYSQRPFAMGAFALFAVLAMAVTMAVAEQCGSQAGGATCPNCLCCSRFGWCGSTSDYCGDGCQSQCAGCGGGGTPVTPTPTPSGGGGVSSIVSRALFDRMLLHRNDGACQAKGFYTYDAFVAAAGAFPGFGTTGSTDTRKREVAAFLAQTSHETTGGWATAPDGAFAWGYCFKQERGATSNYCTPSAQWPCAPGKSYYGRGPIQLSHNYNYGPAGRAIGVDLLRNPDLVATDPTVSFKTAMWFWMTAQAPKPSSHAVITGQWSPSGTDRAAGRVPGFGVITNIVNGGIECGHGQDSRVADRIGFYKRYCDILRVGYGNNLDCYNQRPFAMRLSEFTTLFLLFSVLLLSASAEQCGSQAGGALCASGLCCSKFGWCGNTNEYCGPGNCQSQCPGGPGPSGDLGGVISNSMFDQMLNHRNDNACQGKNNFYSYNAFVTAAGSFPGFGTTGDITARKREIAAFLAQTSHETTGGWPTAPDGPYAWGYCFLREQGSPGDYCTPSSQWPCAPGRKYFGRGPIQISHNYNYGPCGRAIGVDLLNNPDLVATDPVISFKSAIWFWMTPQSPKPSCHDVITGRWQPSGADQAANRVPGFGVITNIINGGLECGHGSDSRVQDRIGFYRRYCGILGVSPGENLDCGNQRSFGNGLLVDIMQNCQCDTTIYCCSQHGYCGNSYDYCGPGCQAGPCWDPCEGDGTLTVSDIVTQEFWDGIASQAAANCPGKSFYTRSNFLEAVSAYPGFGTKCTDEDRKR
EIAAYFAHVTHETGHLCYIEERDGHANNYCQESQQYPCNPNKEYFGRGPMQLSWNYNYIDAGKELHFDGLNDPDIVGRDPIISFKTSLWFWIRKGVQYVILDPNQGFGATIRIINGGQECDGHNTAQMMARVGYYQEYCAQLGVSPGNNLPCMKKNRMMMMIWSVGVVWMLLLVGGSYGEQCGRQAGGALCPGGNCCSQFGWCGSTTDYCGPGCQSQCGGPSPAPTDLSALISRSTFDQMLKHRNDGACPAKGFYTYDAFIAAAKAYPSFGNTGDTATRKREIAAFLGQTSHETTGGWATAPDGPYAWGYCFVRERNPSTYCSATPQFPCAPGQQYYGRGPIQISWNYNYGQCGRAIGVDLLNKPDLVATDSVISFKSALWFWMTAQSPKPSSHDVITSRWTPSSADVAARRLPGYGTVTNIINGGLECGRGQDSRVQDRIGFFKRYCDLLGVGYGNNLDCYSQTPFGNSLLLSDLVTSQMRSLLILVLCFLPLAALGKVFGRCELAAAMKRHGLDNYRGYSLGNWVCAAKFESNFNTQATNRNTDGSTDYGILQINSRWWCNDGRTPGSRNLCNIPCSALLSSDITASVNCAKKIVSDGNGMNAWVAWRNRCKGTDVQAWIRGCRLMKALIVLGLVLLSVTVQGKVFERCELARTLKRLGMDGYRGISLANWMCLAKWESGYNTRATNYNAGDRSTDYGIFQINSRYWCNDGKTPGAVNACHLSCSALLQDNIADAVACAKRVVRDPQGIRAWVAWRNRCQNRDVRQYVQGCGVMKAFIVLVALACAAPAFGRTMDRCSLAREMSNLGVPRDQLNKWACIAEHESSYRTGVVGPENYNGSNDYGIFQINDYYWCAPPSGRFSYNECGLSCNALLTDDITHSVRCAQKVLSQQGWSAWSTWHYCSGWLPSIDDCFKIFSKCELARKLKSMGMDGFHGYSLANWVCMAEYESNFNTQAFNGRNSNGSSDYGIFQLNSKWWCKSNSHSSANACNIMCSKFLDDNIDDDIACAKRVVKDPNGMSAWVAWVKHCKGKDLSKYLASCNLMTKYVILLAVLAFALHCDAKRFTRCGLVQELRRLGFDETLMSNWVCLVENESGRFTDKIGKVNKNGSRDYGLFQINDKYWCSKGTTPGKDCNVTCNQLLTDDISVAATCAKKIYKRHKFDAWYGWKNHCQHGLPDISDCKVYDRCEFARILKKSGMDGYRGVSLANWVCLAKWESDFNTKAINRNVGSTDYGIFQINSRYWCNDGKTPKAVNACHISCKVLLDDDLSQDIECAKRVVRDPQGIKAWVAWRTHCQNKDVSQYIRGCKLMKAVIILGLVLLSVTVQGKIFERCELARTLKRLGLDGYRGISLANWVCLAKWESDYNTQATNYNPGDQSTDYGIFQINSHYWCNNGKTPGAVNACRISCNALLQDNIADAVTCAKRVVRDPQGIRAWVAWRNHCQNRDVSQYVQGCGVKIYEQCEAAREMKRLGLDGYDGYSLGDWVCTAKHESNFNTGATNYNRGDQSTDYGIFQINSRWWCNDGKTPNAKNACGIECSELLKADITAAVICAKRVVRDPNGMGAWVAWTKYCKGKDVSQWIKGCKLMSALWLLLGLLALMDLSESSNWGCYGNIQSLDTPGASCGIGRRHGLNYCGVRASERLAEIDMPYLLKYQPMMQTIGQKYCMDPAVIAGVLSRKSPGDKILVNMGDRTSMVQDPGSQAPTSWISESQVSQTTEVLTTRIKEIQRRFPTWTPDQYLRGGLCAYSGGAGYVRSSQDLSCDFCNDVLARAKYLKRHGFRTDCYGNVNRIDTTGASCKTAKPEGLSYCGVSASKKIAERDLQAMDRYKTIIKKVGEKLCVEPAVIAGIISRESHAGKVLKNGWGDRGNGFGLMQVDKRSHKPQGTWNGEVHITQGTTILINFIKTIQKKFPSWTKDQQLKGGISAYNAGAGNVRSYARMDIGTTHDDYANDVVARAQYYKQHGYMVPSVVFWGLIALVGTAKGSYTHSVHSMNPHV
HPRLYHGCYGDIMTMETFGAPCDINNLMNCGIHGSEMFAEMDLKAIKPYRILIKEVGQRHCIDPALIAAIISRESHGGAVLQNGWDHKGQRFGLMQLDKNMYHPIGSWDSKEHLLQSVGILTERIKAMKRKFPTWNTAQQLKGGLTAFKSGMETIVTPADIDGDLVDDVLARAKFYKRHGFMGYGNIMNVETTGASWQTAQQDKLGYSGVRASHTMANTDSGRMERYRSKINSVGAKYGIDPALIAAIISEESRAGNVLHDGWGDYDSNRGAYNAWGLMQVDVNPNGGGHTARGAWDSEEHLSQGAEILVYFIGRIRNKFPGWNTEQQLKGGIAAYNMGDGNVHSYDNVDGRTTGGDYSNDVVARAQWYKTQKGFMPYGKIEDIKTSGASDVTAAQDGLKEGGWKSSHRMAEIDSNRMENYRTIINEAGRQCDVDPAVIAGIISRESRAGNQLINGWGDHGKAFGLMQIDVTPPPNGGGHTPVGTWDSLEHLIQATEILVEFIERIKTKFPRWNADQHLKGALAAYNKGEKNVESYASVDAKTTGKDYSNDVVARAQWYKSNMGFMKCLVALFLSLSLVACQYDDYDTERKNNNMLSSMNILDLLDSFGLNIKARIAHVRRVAGRIRLTLDIGLGNGDVERESEEAEGEGTDGRGGGEGEREGWGGEREGGEGEREGGEGEREGREGEREGKSSESNESPEDFIGPPVDMCAGESRRGSPSIGCIAAECCQHSFYINSLCPGSSVCCFSMDVCDRLPVPVIPPFPTDPGTLPPPPPIPDSQTTVSPNQPSSYMCHGDFMKLMPKGADQRTARQDNLAYAGVRASNKLVDNDLAELNKRKDCYVQAGKNHCIHPAVIAAIASRETRGGKLLYSTNGYGDGGRAYGIMQCDGGASGLGDICKKYPWDSCEHINQLTDIILLNYVNQMKTKHPSWPAHYQLKGGVSAYNAGVGNVQTIAGMDAGTTNDDYSNDVIARAQRLVNAHGWMLGKNDPMCLVLVLLGLTALLGICQGGTGCYGSVSRIDTTGASCRTAKPEGLSYCGVRASRTIAERDLGSMNKYKVLIKRVGEALCIEPAVIAGIISRESHAGKILKNGWGDRGNGFGLMQVDKRYHKIEGTWNGEAHIRQGTRILIDMVKKIQRKFPRWTRDQQLKGGISAYNAGVGNVRSYERMDIGTLHDDYSNDVVARAQYFKQHGYMHLMLVLLGLAALLGTSQSRTGCYGDVNRVDTTGASCKSAKPEKLNYCGVAASRKIAERDLQSMDRYKALIKKVGQKLCVDPAVIAGIISRESHAGKALRNGWGDNGNGFGLMQVDRRSHKPVGEWNGERHLMQGTEILISMIKAIQKKFPRWTKEQQLKGGISAYNAGPGNVRSYERMDIGTTHDDYANDVVARAQYYKQHGYMNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKSELDKAIGRNCNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRCALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNLMEMISNNLNWFVGVVEDRMDPLKLGRVRVRVVGLHPPQRAQGDVMGIPTEKLPWMSVIQPITSAAMSGIGGSVTGPVEGTRVYGHFLDKWKTNGIVLGTYGGIVREKPNRLEGFSDPTGQYPRRLGNDTNVLNQGGEVGYDSSSNVIQDSNLDTAINPDDRPLSEIPTDDNPNMSMAEMLRRDEGLRLKVYWDTEGYPTIGIGHLIMKQPVRDMAQINKVLSKQVGREITGNPGSITMEEATTLFERDLADMQRDIKSHSKVGPVWQAVNRSRQMALENMAFQMGVGGVAKFNTMLTAMLAGDWEKAYKAGRDSLWYQQTKGRASRVTMIILTGNLESYGVEVKTPARSLSAMAATVAKSSDPADPPIPNDSRILFKEPVSSYKGEYPYVHTMETESGHIQEFDDTPGQERYRLVHPTGTYEEVSPSGRRTRKTVDN
LYDITNADGNFLVAGDKKTNVGGSEIYYNMDNRLHQIDGSNTIFVRGDETKTVEGNGTILVKGNVTIIVEGNADITVKGDATTLVEGNQTNTVNGNLSWKVAGTVDWDVGGDWTEKMASMSSISSGQYTIDGSRIDIGMPPSLRKAVAAAIGGGAIAIASVLITGPSGNDGLEGVSYIPYKDIVGVWTVCHGHTGKDIMLGKTYTKAECKALLNKDLATVARQINPYIKVDIPETTRGALYSFVYNVGAGNFRTSTLLRKINQGDIKGACDQLRRWTYAGGKQWKGLMTRREIEREVCLWGQQMVEINNQRKAFLDMLAWSEGTDNGRQKTRNHGYDVIVGGELFTDYSDHPRKLVTLNPKLKSTGAGRYQLLSRWWDAYRKQLGLKDFSPKSQDAVALQQIKERGALPMIDRGDIRQAIDRCSNIWASLPGAGYGQFEHKADSLIAKFKEAGGTVREIDVMKGKTAAGGGAICAIAVMITIVMGNGNVRTNQAGLELIGNAEGCRRDPYMCPAGVWTDGIGNTHGVTPGVRKTDQQIAADWEKNILIAERCINQHFRGKDMPDNAFSAMTSAAFNMGCNSLRTYYSKARGMRVETSIHKWAQKGEWVNMCNHLPDFVNSNGVPLRGLKIRREKERQLCLTGLVNEMMQISSNGITRLKREEGERLKAYSDSRGIPTIGVGHTGKVDGNSVASGMTITAEKSSELLKEDLQWVEDAISSLVRVPLNQNQYDALCSLIFNIGKSAFAGSTVLRQLNLKNYQAAADAFLLWKKAGKDPDILLPRRRRERALFLSMQISQAGINLIKSFEGLQLKAYKAVPTEKHYTIGYGHYGSDVSPRQVITAKQAEDMLRDDVQAFVDGVNKALKVSVTQNQFDALVSFAYNVGLGAFRSSSLLEYLNEGRTALAAAEFPKWNKSGGKVYQGLINRRAQEQALFNSGTPKNVSRGTSSTKTTPKYKVKSGDNLTKIAKKHNTTVATLLKLNPSIKDPNMIRVGQTINVTGSGGKTHKVKSGDTLSKIAVDNKTTVSRLMSLNPEITNPNHIKVGQTIRLSMKVSQNGLNLIKEFEGCRLTAYKPVPWEQMYTIGWGHYGVTAGTTWTQAQADSQLEIDINNKYAPMVDAYVKGKANQNEFDALVSLAYNCGNVFVADGWAPFSHAYCASMIPKYRNAGGQVLQGLVRRRQAELNLFNKPVSSNSNQNNQTGGMIKMYLIIGLDNSGKAKHWYVSDGVSVRHVRTIRMLENYQNKWAKLNLPVDTMFIAEIEAEFGRKIDMASGEVKMVKKNDLFVDVSSHNGYDITGILEQMGTTNTIIKISESTTYLNPCLSAQVEQSNPIGFYHFARFGGDVAEAEREAQFFLDNVPMQVKYLVLDYEDDPSGDAQANTNACLRFMQMIADAGYKPIYYSYKPFTHDNVDYQQILAQFPNSLWIAGYGLNDGTANFEYFPSMDGIRWWQYSSNPFDKNIVLLDDEEDDKPKTAGTWKQDSKGWWFRRNNGSFPYNKWEKIGGVWYYFDSKGYCLTSEWLKDNEKWYYLKDNGAMATGWVLVGSEWYYMDDSGAMVTGWVKYKNNWYYMTNERGNMVSNEFIKSGKGWYFMNTNGELADNPSFTKEPDGLITVATVQGFDISSYQPSVNFAGAYSAGARFVIIKATEGTSYTNPSFSSQYNGATTATGNYFIRGGYHFAHPGETTGAAQADYFIAHGGGWSGDGITLPGMLDLESEGSNPACWGLSAASMVAWIKAFSDRYHAVTGRYPMLYTNPSWWSSCTGNSNAFVNTNPLVLANRYASAPGTIPGGWPYQTIWQNSDAYAYGGSNNFINGSIDNLKKLATGMKGIDIYSGQGSVDFNAVKESGVEVVYIKATEGLTYTDSTYKDFYDGAKNAGLKIGFYHYLRANDPTSEAEHFFNTISGLSLDCKCAIDVEVTLGQSIDQISSNVRKFADYLINKGLDVCVYTYTNFYKDNLNSTVKDLPLWIAEYGVSKPNIDASYVGFQYSDSGSVNGISGS
ADLDEFSEGILVGGTVVIDPGQGGDDNIKAIQQDLNILLKRGLEVDGIEGPETEAAIKDFQSIMGLTVDGIWGTNTSGAAQQIFSRPLDGVAYPHYEYATRYIQYRVGASVDGTFGSGTKAKVAAWQSNQGLMADGVVGSATWSKLLDENKLGIDVSQPTSTSSFTCLRNKGFTTMVIVRAWKSTGSFDTNAPQTLKNANAAGFSIENSDVYYYPCISCGNMAGQVRTFWQKVGQYSLKVKRVWFDIEGTWTSSVSTNQNYLMQMMNEARAIGIVHGIYGSKYYWGNLFGSSYKYRYRSSTPLWYPHYDNSPSFSDFSSFGGWTSPSMKQYRGDVSVCSAGVDYNYKPMPAYSSLARRGRRPAVVLLGGLVSASLALTLAPTAAAAPLAPPPGKDVGPGEAYMGVGTRIEQGLGAGPDERTIGPADTSGVQGIDVSHWQGSINWSSVKSAGMSFAYIKATEGTNYKDDRFSANYTNAYNAGIIRGAYHFARPNASSGTAQADYFASNGGGWSRDNRTLPGVLDIEHNPSGAMCYGLSTTQMRTWINDFHARYKARTTRDVVIYTTASWWNTCTGSWNGMAAKSPFWVAHWGVSAPTVPSGFPTWTFWQYSATGRVGGVSGDVDRNKFNGSAARLLALANNTAMTKTYGVDVAVYQPIDLAAYHKAGASFAIVKLTEGVDYVNRRGPSRWTAPGLTTSTLMPTISRSFGSSVSRAKKEAAYFLKEAKKQDISKKRMLWLDWEAGSGNVVTGSKSSNTAAILDFMDAIKAAGWRPGLYSGASLMRTAIDTKQVVKKYGTCLWVASYPTMAAVSTADFGYFRQWTGSPSGSLPVTAWPGRRRERCSGMQLRITSRKKLTSLLCALGLISIVAIYPRQTVNFFYSTAVQITDYIHFYGYRPVKSFAIRIPASYTIHGIDVSRWQERIDWQRVAKMRDNGIRLQFAFIKATEGEKLVDPYFSRNWQLSRENGLLRGAYHYFSPSVSASVQARLFLQTVDFSQGDFPAVLDVEERGKLSAKELRKRVSQWLKMVEKSTGKKPIIYSGAVFYHTNLAGYFNEYPWWVAHYYQRRPDNDGMAWRFWQHSDRGQVDGINGPVDFNVFNGTVEELQAFVDGIKETPMRFIALLISFFALLKVISAISGVDISSASTIESFTCLKSAGYDFAIIRAYESLGQVDPNGPHSVYNARDAGIEYVDVYMFPCPTCGNGAGQAETMVNYLKGYNANYGMVWLDIEGPQYWMSQSENVAFFESLVAGLKAEGAHIGVYTSASQWEPIMGGYTGGSEFPLWYAHYDGNPSFSDFSPFNGWSTPSVKQYDDTGDSCGLGFDLNWYPMHCAPSWKSSDERRTMLDQINTLDPNSLTALKRMSKDNSPAAIKGAAQQFEALFLQNMLKSMRDATVTSDAMGSETTRFYQGLYDQQLAAMMAQRGGIGLADVMEKQMGAQAASAQNAAAAGASSAGNVPLSLDAARAAAAHTASGDKVPTTPQAFVDATWPQAAKAAQSLGVPAHFLVAQAALETGWGKSQIRNKDGTPSYNLFNIKAGSNWTGKVVEARTVEYENGQRKVRVERFRAYDSYEQAFQDYADLVGNSPRYAKVAGKTDGHAFARALQEGGYATDPSYADKLARVINGNALRQRLMASAASARGMINKKWMKIVMIPMLVVPMYGLTSVSGQIQDSLTGENSFVKDAEAATTASQQAFIDKIAPAAQASQEQYHLLSSITLAQAILESGWGKSGLATKGYNLFGIKGKYNGQSVIMSTSEYVNGQWIKIDAEFRKYPSWNESVTDHTLLLVNGTSWNKNLYKKVVDATDYKVAAMELQKAGYASPTYGASLIQVIENYDLAKYDVLYDKILTQKSTSGKATVTSPTGNGVWTLPYKVKGVQSVSPASTYANKDIDLVSVATTKRGTYYQFKYNGKVVGWVDAKALTIYDSVNYDKVNVGRAKITSPVSNGIWSKPYNVYGREFVTNATTYAQQEIKLLREAQTAKGTYYQFSINNKTIGWIDK
RALTIYPYDSIVSSKNVSLDGQITNPTGNGIWTKAYKLEGTTSVAQATKYANKDVKISQQVETQHGTYYNISIDGKAIGWLDKNAITLYDQAEYNKTVAFDAAIRNVQGNAVWTEPYRTVGTKLIGPAETYLNKEVEVVREAKTPKGTYYQFKSGGKVIGWLDKKAFEVYDNINYNKAVNLDAVVENVTGNAVWTAPYKSKGVKLVTSAATYKGKATKITREAQTSRGTYYEFSVNGKVIGWLDKKAFDVYDSIEYNKAINMTGLLSNAPGNGIWTEPYRVLDTKNIGQATAYANKTVQLVREAKTSHSTYYQMSLNGKVIGWIDKRAFTNVKMVNTQVKRVKKQKFIAGTALLLGMATFGMVGKADDLSSSNTNGGVDNSKVDNDNQESVKTSTEGVSSTTENANTVPESKVTSTVDSESAPSKTISAGTQSNISGTSDGSDSLPKTETSDSSSKPSTSNSSSKPSTSNSSSKPSTSNSSSNNNSATKPSTTTQAPPVAPSTTAPSATPSTTAPSNYYQNSSYNQTSTAAQIPNSSSDSAASVYSGPVLKKIEAAKPIEKIDSSSTEAFIKSIADRVRILAGKNNLYASIILAQAILESGSGQSNMTQQYFNIFNITGAYLGKSISFKTEEFSGNNPYYIEQSFRVYSNYDQALDDYINLMIKGTTWNSEIYAGAWKSHAKTYQEAAQALQGIFATDPEYAQKLIEIIEEYNLNFYDNVDSTTQVLDSNIPESPLVASKLDSSTYPDYNGVEYPGADSYAFGNCTQYVYNRIIQLGGQIGTHMGNGGEWGINAQAQGYFTTTVPTEGYAVSFPPGVAGSSPEYGHVAFVEKVYPDNSILVSEMNVKGNNIVSERHISAGVAALATYIQPKMNRNRLSCLIVGAVIGAGAIVCTTNTKVHAKPVNEVKNINTSKGNSFGEIISSEDIGLRKGADSSHEIITSIPSGARVNIIDKMSKDWYKVSYKDFTGYLQAKDIRVLGDELNQDNVGLISANQLNVRTSPNENGQVIGTLHKNDKVNVLDKSIDGWYKIDFNGRRAYVSSKYVNLISYKNNEVKTEVKKEPIEGTGKVNINTALNVRQASTTNSRIIGSLKGGEKVNIISESNGFYKIEFNNSYGYVYSKYISKDGDSEKVQVVKQEEVKKEKVDESKKEAKATPKAEPVVLAVRSLNKTGIVNVSSSLNVREGAGTSSKVIGSLSGNTKVTIVGEEGAFYKIEYKGSHGYVAKEYVKDVTESSNSNQGTQTPEKPSTPESTEKTGIVNVSSSLNVREGASTSSKVIGSLSGNTKVIIVGEEGAFYKIEYKGSHGYVAKEYIKDVTESNNSNQGTQTPEKPSTPESTEKTGIVNVSSSLNVREGASTSSKVIGSLSGNTKVTIVGEEGAFYKIEYKGSHGYVAKEYIKDIKDEVVTEPEKPSAPENTEKTGVVNVSSSLNVREGASTSSKVIGSLSGNTKVIIVGEEGAFYKIEYKGSHGYVAKEYIKDVTESNNSNQGTQTPEKPSTPESTEKTGIVNVSSSLNVREGASTSSKVIGSLSGNTKVTIVGEEGAFYKIEYKGSHGYVAKEYVKDVTESNNSNQGTQTPEKPSTPESAEKTGVVNVSSSLNVREGASTSSKVIGSLSGNTKITIVGEEGAFYKIEYKGSHGYVAKEYIKDIKDEVVTEPEKPSTHENSKKTGVVTASKGLNVRKEANTSSQIIGILNSGESVEIIGEENGFYKITYKGQEAYASKNYINIFDGNSNVNPGLDIGNASKTNYGVSLNEYIKLQQRNNPSNYSYSEFEKYINPAKATNKLQFLRIDKFRSVNVSGLSSRLSNKGVLTGQGQAFVNAAKAFNIDPIYLVAQCLHETGNGTSKLAKGVTITEIADESKPIYNGNGQLVGYHMIKLSKPVTVYNLFGIGAKDNSSVFPNRALILGTTYAYNRGWTSIENAIKGAAEFVSLNYVHSSRYSQNTLYKMRYNQNVSNIWHQYATTPWYASSIADIMRSYQDLYLENNFTFDVPVFAG
MKKESMSRIERRKAQQRKKTPVQWKKSTTLFSSALIVSSVGTPVALLPVTAEATEEQPTNAEVAQAPTTETGLVETPTTETTPGTTEQPTTDSSTTTESTTESSKETPTTPSTEQPTADSTTPVESGTTDSSVAEITPVAPSATESEAAPAVTPDDEVKVPEARVASAQTFSALSPTQSPSEFIAELARCAQPIAQANDLYASVMMAQAIVESGWGASTLSKAPNYNLFGIKGSYNGQSVYMDTWEYLNGKWLVKKEPFRKYPSYMESFQDNAHVLKTTSFQAGVYYYAGAWKSNTSSYRDATAWLTGRYATDPSYNAKLNNVITAYNLTQYDTPSSGGNTGGGTVNPGTGGSNNQSGTNTYYTVKSGDTLNKIAAQYGVSVANLRSWNGISGDLIFVGQKLIVKKGASGNTGGSGSGGSNNNQSGTNTYYTVKSGDTLNKIAAQYGVSVANLRSWNGISGDLIFVGQKLIVKKGASGNTGGSNNGGSNNNQSGTNTYYTIKSGDTLNKIAAQYGVSVANLRSWNGISGDLIFAGQKIIVKKGTSGNTGGSSNGGSNNNQSGTNTYYTIKSGDTLNKISAQFGVSVANLQAWNNISGSLIFAGQKIIVKKGANSGSTNTNKPTNNGGGATTSYTIKSGDTLNKISAQFGVSVANLRSWNGIKGDLIFAGQTIIVKKGASAGGNASSTNSASGKRHTVKSGDSLWGLSMQYGISIQKIKQLNGLSGDTIYIGQTLKVGMKKRLIAPMLLSAASLAFFAMSGSAQAAAYTDYSLYKVEPSNTFSTESQASQAVAKLEKDTGWDASYQASGTTTTYQISASGIHSESEAKAILSGLAKQTSITGTSSPVGSKQPYVTISSGAISGEKQANTILAKLKQETGVAGAVKAYGAAQPYMNVMTSDIADETKVKALIQSLAKQTGIKSSYQPITHTVSVTTIQSGTIVGDSRAAQIKNAFQKESGLQASLKETVKGQAYYTFTTAAISGEANAKTLLQQLKQSTGITGSYKSINQKTTVESYNVQSAYFKGLSTVKDAISQIKKNTGVSGSYQQVGKSTSYTVNMKGITKQQLQKIDTFFKKKKWHYTSSSVKKTTTSAAYQITTAKILGEQQANKAAAFFAQKKVKAAKTAAGSTAENQYQLISEETSDQAKVTKGLNILKKNQLSASAKSVKKQIADTFKITTESLLDQTKVNQALTFFKSNHISVASQKTGQTAASSYQITTEAIISQEEIDRVLTFFKQNHIAVTTSKTGQTAYTQYKIVTTQLSSKTALNNGLTYLKSKSVTPSYTTKSNTLYKISVNEQFTGNDTAAAASTKLKQLYGWTSSIVKIKNGPQIMKTNYNLSLRDMVQKQMTVSPQTDGAAYVSLTYINTATSTVTADVLNIRSTPEVSPTNVIGQFKKGDKVKVIGQINGWAKINLGWRNASSDEVVQYVDPNNFSRDSKYYFQFLKLSQTAGLSVTEVNQKVLAGKGILTGRAKAFIDAANQYSINELYLISHALLETGNGTSALANGLTYNGKTVYNMYGIGAYDSNPNYYGAKYAYEQGWFTPEAAIIGGAKFIGSSYIHNTAYNQDTLYKMRWSATATHQYATDIGWAYKQVNRMYSLYSLLDGYTLYFDVPEYRMARKKLKKRKLLISLFFLVSIPLALFVLATTLSKPIEISKETEEIDEQQVFIDSLSGHAQILYEKYHVLPSITIAQAILESDWGNSELAAKANNLFGVKGNYKGHHVTMETDEVEKGKRKTIRAKFRKYSTFFESMDDHAQLFVRGTSWNKKKYKPVLEAGNYKEAATALQTSGYATDPDYADKISAIVEKYDLDEYDEVNPSLKSVDLNASIKDSAVQDVWSKPSTDDRSIRLTSAQSYVGKDIKVVSKKQKGQSVWYQFQINDKLIGWIDDSAVEIKEATMARKLIKNLGKSKSVKRVKLLFKKIFITVFIVASIVAIFNITKYFEELYKVRDLKSTKIEYYMDVADEAGDGKVQLSWKALLAIDMVIHDEDLSNIKKKDT
LDIGEKFIVEDKNDKGEKVYKVKKFNKVLSELKFDSSQKSRARKYMKDLEYTYLGNKQLDSSDEKIKFIKKLEDSAIREYIDYGILPSITIGQAILESGWGNSKLTKQSNNLFGIKADKAWKGKSVEISTSEHYNEKIVASFRSYNSLQDSVKDHSLFLINNKRYRKHGLFEAKDYISQAQALENAGYSTAEDKKGNRIYAELLIDVIRSYNLQLIDNKVETKMFFLTLPLLLGCTAATTPLTAATPPVDPLPLKVVSTDQLPKGLAKDQQLWNKVNGQKGDYKALLTAIDHSLEYLGTDKAQKDYQDYKVPGITRDRVSRSLRRFRQLVVQAKSPQALETAVKKEFQFYQSIGNDQKGNVDFTGYYEATYPASRQPTTEFRYPLYQAPADLKAWPKPHPTRAELEGADGLQASQGPLKGLELVWLRDRIQAFLVQVQGSARLGLTDGTEMTVGYAGKTAHPYTSIGKALIADGKFTLEELSLPVVLQYFEENPQDLDLYIPKNKSFVFFQETFGSPPMGNLNVPVTDERSIATDKSLMPPGALALIQTNLPYYNASQTLEFKDVSRFVLDHDTGSAIKGPGRVDIFMGTGAKAKERAGVMTGSGQLYYLLLKDNMNTPFSIDEVSFRDLPGWGQDDPRKLFPAMATILSHLRNAKPYRTGALGITAAELVSLLELAERGQVNSPEQARQFFETNSVPFRISPAQGKSGFVTAFYEPELEVSATPDDVWRYPIYRRPPELVDIDNDNRPDGFDPSYAFGKADEEGISYFPDRRAIDEGCLRGRGLEIAWARSKVDLFFVHVQGAARLVFPDGAIKRITYAAKAGHVFSPIGRLLLDRGELDPKTISMQTIRQWLADHPDEVDGVLWHNRSYIFFREADVAGLDMGPIAAAKVPLVAGRALAVDRLIHTFGLPFFIHAPTLTHLDDGKPFARLMLALDTGSAIVGPARGDIFTGSGFEAGELAGTVRNEADFYILLPRIAAERYRRMRKIQVAVFLFVGLLAACSTVPPSSAPTTCAQCQPCPACPAVTPAITPAPAPAFSRSLLPASWGDLPGWAEDDVTAAWPAFMQSCRGIASRGNAAGWRRVCELARAADGKPENDVRRFFERHLKPYAIVNGDGLVSGLVTGYYEPMLRGSRTKAKGYEQPVRGVPDDLLTIDLSAVFPELKDKRVRGRLEGNKVVPYWSRAEIAARGDKLPGKTLLYVDDAVELFFLQVQGSGRVKLADGGMVRLNYADQNGYQYQSIGKALVERGELKLEEASMQGIQAWARANPARLESLLNTNPSYVFFREVANSADGPVGALGVPLTAERSIAIDPRSVPLGSPVFLATTRPNSAVPLNRLVMAQDTGGAIKGGVRADFFWGFGKEAGDQAGRMKQSGRMWILLPTELAPKMKGRWVKYLLMGTVVAMLAACSSKPTDRGQQYKDGKFTQPFSLVNQPDAVGAPINAGDFAEQINHIRNSSPRLYGNQSNVYNAVQEWLRAGGDTRNMRQFGIDAWQMEGADNYGNVQFTGYYTPVIQARHTRQGEFQYPIYRMPPKRGRLPSRAEIYAGALSDKYILAYSNSLMDNFIMDVQGSGYIDFGDGSPLNFFSYAGKNGHAYRSIGKVLIDRGEVKKEDMSMQAIRHWGETHSEAEVRELLEQNPSFVFFKPQSFAPVKGASAVPLVGRASVASDRSIIPPGTTLLAEVPLLDNNGKFNGQYELRLMVALDVGGAIKGQHFDIYQGIGPEAGHRAGWYNHYGRVWVLKTAPGAGNVFSGMKKYLFRAALCGIAAAILAACQSKSIQTFPQPDTSVINGPDRPVGIPDPAGTTVGGGGAVYTVVPHLSLPHWAAQDFAKSLQSFRLGCANLKNRQGWQDVCAQAFQTPVHSVQAKQFFERYFTPWQVAGNGSLAGTVTGYYEPVLKGDDRRTAQARFPIYGIPDDFISVPLPAGLRSGKALVRIRQTGKNSGTIDNTGGTHTADLSQFPITARTTAIKGRFEGSRFLPYHTRNQINGGALDGKAP
ILGYAEDPVELFFMHIQGSGRLKTPSGKYIRIGYADKNEHPYVSIGRYMADKGYLKLGQTSMQGIKAYMQQNPQRLAEVLGQNPSYIFFRELTGSSNDGPVGALGTPLMGEYAGAVDRHYITLGAPLFVATAHPVTRKALNRLIMAQDTGSAIKGAVRVDYFWGYGDEAGELAGKQKTTGYVWQLLPNGMKPEYRPMKFPFHPWRRLLLCALPFAALLTACDDGKKEPPPTPAEVTTYNSVPWDALPATSDADLLAGFNAWRSACARLAKDPVWGEPCASATTVAADPTAVRAFLQERMQVYSLRSSSNGDQGLITGYYEPVYHGSLSQGEKTPVPVYGVPDDLVVVALESVYPELKGKRLRGRLEGRVLKPYDDAATIRDNGSSAPVLAWLGDPMDLQFLQIQGSGRIQLEDGRQLRIGYGDQNGHPYKPVGRWLVEQGLVPKEEISMKRIRDWAEANPQRVSELLASNPSFVFFSLRPDSDEGPRGSLNVPLTDGYSVAIDRKVIPLGSLMWLSTTRPDDGSAVVRPVAAQDTGGAIVGEVRADLFWGTGDAAGELAGHMKQPGRLWLLWPKGAPLPASMGAMNGTSGRRLSTATRVAAMAGVLLLAACGGPSSRPGLVSRPAGVAGPVSYQRVAIEGLPGWSTDRVADALPVFRRSCERLRAVSPNSMVGPSVWGSRASDWQAACAVAARLPAFDDDAARRFFAERFQAWQVTGAGDPTGLFTGYYEAALDGSLSPSAVYSTPIYGVPLDLRMEGGKGMRVSGGRSLPYPDRAAIEEGAISGVAPVIMWARDPVDVFMLHIQGSGQVRLPDGRIQRIGYAANNGHPFVGIGAIMRDRGLGDGSSMIAIRAWLRANPAEGRALMRENPRFIFFRPIEGEGPIGAQGLPLTGGRSLAVDPSSVPLGAPVWLATSDAHGETVNRLMVAQDTGSAIKGAVRGDFFWGSGEEALYHAGGMKSAGRYWVLVPRGGRNAVAQNMKGRWAKYVATGVMLAMLAACSSKPTDRGQQYKDGKFTQPFSLVNQPDAVGAPINAGDFAEQVNQIRSASPRLYTNQSNVYNAVQNWLRSGGDTRTMRQFGIDAWQMEGTDNYGNVQFTGYYTPVVQARHTRQGAFQYPIYSMPPKRGRLPSRAQIYAGALSDKYILAWSNSLMDNFIMDVQGSGYIDFGDGSPLNFFSYAGKNGWPYRSIGKVLIDRGEVKKEDMSMQAIREWGEKHSEAEVRELLEQNPSFVFFKPQSFAPVKGASAVPLIGRASVASDRSIIPPGTTLLAEVPLLDNNGKFSGQYELRLMVALDVGGAIKGQHFDIYQGIGPDAGHRAGWYNHYGRVWVLKSAPGAGNVFSGMFKRRYVTLLPLFVLLAACSSKPKPTETDTTTGTPSGGFLLEPQHNVMQMGGDFANNPNAQQFIDKMVNKHGFDRQQLQEILSQAKRLDSVLRLMDNQAPTTSVKPPSGPNGAWLRYRKKFITPDNVQNGVVFWNQYEDALNRAWQVYGVPPEIIVGIIGVETRWGRVMGKTRILDALATLSFNYPRRAEYFSGELETFLLMARDEQDDPLNLKGSFAGAMGYGQFMPSSYKQYAVDFSGDGHINLWDPVDAIGSVANYFKAHGWVKGDQVAVMANGQAPGLPNGFKTKYSISQLAAAGLTPQQPLGNHQQASLLRLDVGTGYQYWYGLPNFYTITRYNHSTHYAMAVWQLGQAVALARVQMFALTAYRLRCAAWLLATGIFLLLAGCSEAKAPTALERVQKEGVLRVITRNSPATYFQDRNGETGFEYELAKRFAERLGVELKIETADNLDDLYAQLSREGGPALAAAGLTPGREDDASVRYSHTYLDVTPQIIYRNGQQRPTRPEDLVGKRIMVLKGSSHAEQLAELKKQYPELKYEESDAVEVVDLLRMVDVGDIDLTLVDSNELAMNQVYFPNVRVAFDFGEARGLAWALPGGDDDSLMNEVNAFLDQAKKEGLLQRLKDRYYGHVDVLGYVGAYTFAQHLQQRLPRYESHF
KQSGKQLDTDWRLLAAIGYQESLWQPGATSKTGVRGLMMLTNRTAQAMGVSNRLDPKQSIQGGSKYFVQIRSELPESIKEPDRSWFALAAYNIGGAHLEDARKMAEKEGLNPNKWLDVKKMLPRLAQKQWYAKTRYGYARGGETVHFVQNVRRYYDILTWVTQPQMEGSQIAESGLHLPGVNKTRPEEDSGDEKLMIGADTAKECDAMTFKLLPLAVLCAALVGCQSAQSRDARAESPATAESAAPTAEAPVSEAQEADFETWLANFRRQARGEGIDEATLARALDGLRYRPRVIELDGSQPEFVRPIWEYLDSAVSASRVKKGRERLAEYRDTVRQMTERYGVPGEVLVAIWGIESSYGDYLGDFSTLEALATLAYDGRRRDFARGELLAALRIIEAGDISPERMKGSWAGAMGHTQFIPSSFLAHAVDGDGDGRRDIWNSIADVLASTANYLDEAGWREGEPWGTEVSLPQGFDYTLTEPDIRRSSAEWAAAGVRSRDGHALPDFASASVIAPAGAQGPVFLVGHNFRVILRYNNATSYALAVATLSDAIAGRAGIQGEWPREQPALKRSEVREMQQLLDARGFDVGTPDGILGPNTRRGLRAFQREIGVTPDGFATKALLERLRRMPGLPRARMAQWHPLYSVRLAKDTMTDTQRSLRRPLLGAALSAAALGLCGLSPSLLAAGKRRVSLREEEIEPGRYRDNPQARAFIDEMVARHGFDRGMLQDWFGQAVYSATVVRLIMPPATTGRKSWRTYRSRFIEPIRINAGVRFWQDNRDTLRRAEAEFGVPASVIVGIIGVETIYGRDMGSFRVLDSLSTLAFDYPATPNREARSTLFRNQLADYLLWCRDTRTDVYSVLGSYAGAIGIPQFMPTSLREYALDYDNNGHIDLRNSPTDAIGSVARFLQLHGWEPGRPVVWRIAPDDGSLGVATAAADGEPWPTRTLNQLTRAGLRVDEPINLAREGETGVLVVDLPTPDQPTEYLLGLRNFYVLTRYNRSFFYALAVYQLGEAVKAAMGMFGILNRREMLRGTAATLLLPGILTSAHAGQVAEDPLLRYPWLAQWAGADGLDAPWLRGVFQNLKKYPRVIRAMNHQAEAKPFYLYREHVTSPWLYKKGREAWQQHRAMLEAAGARYGVDAPFVLALWGMESRFGRNQGEHPVLRTLFTLAVDYPRRQTFFRQELRHFLILCRQQGWDPMLLKGSYAGAMGHVQMIPSSLRYYAVDGDGDGRLDVFNNPMDATASIAHYLGKHGWELGGPYLIPVYGITDLSAIKSAKVKEMQPWSSWYALGVRTRGEPPPAERAMALIALEEQDGLRYYGVFNNFRVILDWNRSTRFAKVVGELAEGFVLMPTPATRASLIGLALASGLLAGPARADFQSCLAGIQAQAAGAGVSAQTFRAATANIAYDDKVIELSQAQPEFKTPIWDYMSALVDEERVEDGRAAMRQHAQALANAEARYGVDRHTIAAVWGVESNFGKNLGKMPLVQSLATLACSSNRRRDFFRSELIATLKIIERGDIEASRLTGSWAGAFGQTQFMPTTYQRLAVDGDGDGRRDVVDSVADAVASTANFLRVAKWSNGQPWGYEVRLPRGFNVAAAGRKNKHAVGHWASLGVTRVDGKALTGDGPAGIIAPAGINGPAFLVTKNFDAIYSYNAAESYGLAIAVLSDRLRGRPGVQADWPTDDPPLSRAERRDLQTRLTARGYDVGEPDGKVGSKTREAIKEIERQLGMPATGRPGGKVLEALRRGMFKYSFIAVIVSTVLLSACADSHQKSAEKKPVTSEIANIATSAPARWKQIDVVSLEQAFPKQSRTPAQFPAYVDALKQKAAELGYKPETINFAFSEIHFIDRVVKSDRNQPEKKITLDVYLPRVVTKGRIAEGAKLYQANQQTLAQISNQYGVPANYIVALWGLESGFGRVQGKEDVISALATLAFEGRREALFSRQLMAALEIIENGHLPVGQRLKGSWAGAMGQTQFMPSSFLTYAADGNGDGNIDIWN
SREDAFASAANYLATEGWQRDLPWGEQVSLPANFNQQLEGIKTEQQKTVAQWKALGVQLPANSQLSDDMKVWLIIPDDDLHRSYLVTQNFRTIMHWNSSYFFALSIVTMADGVANKINTLPTQHMKKESRPAFDAAAVFDAAAVPVSDSGFAANANVRRFVDDEVGKGDFSRAEWQDFFDKAAYKADIVKIMHRPSTSRPWYVFRTGNSGKAKFRGARRFYAENRALIDDVAQKYGVPAELIVAVIGIETNYGKNTGSFRVADALATLGFDYPRRAGFFQKELVELLKLAKEEGGDVFAFKGSYAGAMGMPQFMPSSYRKWAVDYDGDGHRDIWGNIGDVAASVANYMKQHGWRTGGKILVSATLAPGADVQAIIGEKTALTRTVADLKAYGIIPGEELADDEKAVLFKLETAPGVFEYYLGLNNFYTVWQYNHSRMYVTAVRDIANSLGGSGLMASSSSSKQAKPIHRMAWRLGVSLTLLLGLGALFVLPKFDPKSLTWPTTEPGRIAPLAMSGGNPYLRALMRTISASESNDASPYTVLYGGSHIENLQEHPDRCIPIRWGPNQGLCTTAAGRYQFITTTWLETAEKYHPAPTGEWMWRRYSFAPEYQDRVVYAWLDDVNYWGTDIPQLLEDGQLQTVLKRLSGTWTSLGYGIESNKVTPHLMHIYERMLAEEIALANGLPTNYLPTVANQSVETTRMIIQHSQPKRKGTKYRLKKPYKLVFNLIIVVGLIGLVYSFKKNTQPLVNPSLVTHLPELEMSGGDPYIRALMLTISASESNHKNSYYLLYGGSHVHNLQQHPDQCIPINIGPNRGNCSTAAGRYQFLNSTWQEKARKYHPNPQKNYRQYIYSFEPKYQDIVVYRWLKDHHQWNVDLLTLLKQDQVEEVLRKLSNVWTSLGGGIEDNSMTPHLPSIYRYFLAQELNRENADQNSLMVEINNQRKAFLDMLAWSEGTDNGRQKTRNHGYDVIVGGELFTDYSDHPRKLVTLNPKLKSTAAGRYQLLSRWWDAYRKQLGLKDFSPKSQDAVALQQIKERGALPMIDRGDIRQAIDRCSNIWASLPGAGYGQFEHKADSLIVKFKEAGGTVREIEVMGYTWKGLAKQYGFTDFSPATQDKAAVALILAKKGAMEAILNGDYEQAVMKLGGIWASFPTAPNEYRQHKRSWGFVHNFFRQRGFMARISAADAGGVNVIAFLDMLAWSEGTSTIKASDYGYDVLVGGKLFSEYSKHPRVKVWLPKYSIYSSAAGRYQFLAGTWDAIVKNYGFKGRFIPEAQDLAAIKLLTECGALPLIKAGRIVEAIAKAAPIWASLPGAGYGQREHKLAALLGIYEAERAAEAKPQDQLLAMFSACGGEMAAMTRYEFALLALAAVGYVVWRDWQRSEEPGAQSPDFIDQAENLFYDATEGNFFGGTEDTDMGQAQLNRAAFLLTIRTGEGTAGNDGYRMLFGGGKFDSFADHPRQVVTALSNGKPISSSAAGAYQFLRRTWDTLAARLGLTDFSPASQDAAALELIREAGALGDVDAGRFALAVRKVRKIWASMPGAGYGQPEVALERLQAAYQAAGGVVNGMPVINTHQNIAAFLDMLAYSEGTANHPLTKNRGYDVIVTSLDGRPEIFTDYSDHPFAHGRPAKVFNRRGEKSTASGRYQQLYMFWPHYKKQLALPDFSPLSQDKLAIQLIRERGAIDDIRAGRIERAVSRCRNIWASLPGAGYGQREHSLEKLVTVWRTAGGVVAMYSQQVQQINQPQKNSDIQLINMWLQQIHPIQQNSHLYIAQMFLKFIKKPLKKVTSADVIAFANVYGVRSHNSHSNQQKRIETINSLLKFGQEAGILPRNQKKTFSPNTTNFKTSVYSQNKIKNYRTTGKQQKKPLNWSQLFNLQLASSVLIVFILLMAILQLFRQVSGSTNANQNKSVTSVVMPKIDPTKNWAYPVNVPRIRAFLDTIAVTEGTTGPKGYYRQYTGSHFLSFEDHPRELKCANSNGKKLCSDAAGRYQFLSTSWDRFA
PVVKAQNFSPTYQDRVAIELIRDKNALKDIEEGRVKEAFQKLYMVWPSFGETETDVEQLMPKLVGTYEQKLALYQIKNMDDEFERAFKKILDYEGGYSDEQKDHGGKTKYGITEKLARDYGHEGEMKDLELEKAKEIYYREFWANHLYSWIEDERIATEVFEQAVNMGAKTANKHLQKAYNLLADKEIAVDGIIGQRTLEAVNNFEHNSDLFKLLNILQAKKYINIVKNDASQQKFIRGWLRRVELDIDSRKSMKRNFQTVMPYIFSEEGGYADNPADPGGATNMGITINTLSAWEGRQVSPQDVKELTQATATQIYQVEFWNKIDGNDLPSGVDYALFDFAVNSGPGRAAKTLQKILAMPEDGIIGAQTVAAAAARSPEGIINALCDARAAWLRGLSTAATFGNGWLARVERVRARALALAATPPAITQPADPAGNPSPKARQADIAFTSALKHPEALGTMGSVASGLAAIATGNGPVQYALAIVMVACAGVGLWYFVRRVRSEPMNFDQAFDRLLGHEGGYSNNSADPGGETMWGVTARVARADGYLGEMRDLPRDRAKSIYRRLYWTPVRADELPEVVRFDVFDGAVNSGPAQSIKWLQRAAGAVDDGILGPRTMAAAVAAGPVLAARYNGHRLLFLADRPTWGSFGKGWARRVGKNLLGAMDQPPWLQAAWAEFGVREIPGKEDAPEILRYFRDAGDTNVETEATPWCAAFLGAMLKRAGYAGTGSLLARSYLDWGDRLDDARFGAVAVLSRGDDPNAGHVGFLLSDTNGKLYLLGGNQGDAVTVASFDKARLLGLRWPKENVEAASKGDDAIFSRVLAHVLEMEGGFSNDPYDPGGPTNRGITLEVYAKFRKETLDDGTRARLIAELKRIPDAIVTAIYRQRYFDPASCPVFTAPLALMHFDAAVNHGVGAAIRMLQGVAGVTVDGEIGPETLAAIGAKSLADLLDDYAETRRARYRALPHFWRFGRGWLKRVDATLALARTWAAAEATNRGLIEPQQIAKGEGKMGEKSKTEISSSDDSKWWLNSKTMWGTLITAAATVIPVLGPAVGIVLPADLITSFGDQVVTAAQALAGLFGTALAIYGRLKADTPLVLRKNMSAPLTFQQVFDRVVGHEGGYVNDPHDPGGETNWGITKYTARENGYTGSMKAMTREQAYKIYEKAFWQRYHCEKLPEAVAFQFFDAAVNHGVGNASRMLQRAVNVADDGIIGKVTLSAVEKMPISDLLLRFNAERIRFYTKLKNFPRYGKGWMNRIAGNLAYAAIDNEVMNPIIDGIIALEGGYVFNPKDKGGATHWGITEATARAHGYAGDMRDLTHAEAYAILEEDYWIKPGFDVISTLSWPVSFELCDAAVNIGAYHPSAWLQRWLNVFNHEGKRYPDIHVDGNIGPRTLAALEHYLAWRGQEGEAVLVKALNCSQGTYYLNVAEKNHNNEQFIYGWIKNRVTMDSFEDAFKALIGNEGGYSFNPADPGGETMWGVTARVARSEGYNGAMKDLPLETAHQIAKRRYWDPLHLDELDPRVAFQIFDANYNGGLVVLWMQKASGAKEDGKFGPDTLDAVKNADPMKFVMRFAAYRLRYLRNLHSWPSFSRGWTERMAANLLLGAAMSQTATLSDFNKAFDRVIQHEGGYVNDPRDAGGETKFGITIHTARANGYTGSMFTMTRDDAKQIYLKAFWQRYRCNEFPPELAFQFFDACVNHGSGNASRMLQRAVGVVDDGIIGEITLAAIRKRSTVEVVTLFNAERLEFYTKLSGFQHFGKGWIRRMAGNLRHIADDVGDK']
Target names: '18', '19', '22', '23', '24', '25', '73', '102', '103', '104', '108'
In [ ]:
# Echo the loaded object as the cell's output. The recorded repr below is a
# dict-like with 'DESCR' and 'data' keys, where 'data' holds the sequence strings.
# NOTE(review): this prints every sequence in full, which bloats the notebook;
# consider previewing only the first few entries of 'data' instead — confirm
# the object supports slicing that way before changing the cell.
sequence_data
Out[ ]:
{'DESCR': 'Sequences',
'data': ['MRKFNKPLLALLIGSTLCSAAQAAAPGKPTIAWGNTKFAIVEVDQAATAYNNLVKVKNAADVSVSWNLWNGDAGTTAKILLNGKEAWSGPSTGSSGTANFKVNKGGRYQMQVALCNADGCTASDATEIVVADTDGSHLAPLKEPLLEKNKPYKQNSGKVVGSYFVEWGVYGRNFTVDKIPAQNLTHLLYGFIPICGGNGINDSLKEIEGSFQALQRSCQGREDFKVSIHDPFAALQKAQKGVTAWDDPYKGNFGQLMALKQAHPDLKILPSIGGWTLSDPFFFMGDKVKRDRFVGSVKEFLQTWKFFDGVDIDWEFPGGKGANPNLGSPQDGETYVLLMKELRAMLDQLSAETGRKYELTSAISAGKDKIDKVAYNVAQNSMDHIFLMSYDFYGPFDLKNLGHQTALNAPAWKPDTAYTTVNGVNALLAQGVKPGKVVVGTAMYGRGWTGVNGYQNNIPFTGTATGPVKGTWKNGIVDYRQIAGQFMSGEWQYTYDATAEAPYVFKPSTGDLITFDDARSVQAKGKYVLDKQLGGLFSWEIDADNGDILNSMNASLGNSAGVQ',
'MSTRKAVIGYYFIPTNQINNYTETDTSVVPFPVSNITPAKAKQLTHINFSFLDINSNLECAWDPATNDAKARDVVNRLTALKAHNPSLRIMFSIGGWYYSNDLGVSHANYVNAVKTPAARTKFAQSCVRIMKDYGFDGVDIDWEYPQAAEVDGFIAALQEIRTLLNQQTIADGRQALPYQLTIAGAGGAFFLSRYYSKLAQIVAPLDYINLMTYDLAGPWEKITNHQAALFGDAAGPTFYNALREANLGWSWEELTRAFPSPFSLTVDAAVQQHLMMEGVPSAKIVMGVPFYGRAFKGVSGGNGGQYSSHSTPGEDPYPNADYWLVGCDECVRDKDPRIASYRQLEQMLQGNYGYQRLWNDKTKTPYLYHAQNGLFVTYDDAESFKYKAKYIKQQQLGGVMFWHLGQDNRNGDLLAALDRYFNAADYDDSQLDMGTGLRYTGVGPGNLPIMTAPAYVPGTTYAQGALVSYQGYVWQTKWGYITSAPGSDSAWLKVGRLA',
'MLSFVKKSIALVAALQAVTALATPISSEAGVEKRGSGFANAVYFTNWGIYGRNFQPADLPASEITHVLYSFMNVRADGTIFSGDTYADYEKHYAGDSWNDVGTNAYGCVKQLYLLKKQNRNMKVMLSIGGWTWSTNFPAAASSAATRKTFAQSAVGFMKDWGFDGIDIDWEYPADATQAQNMVLLLQAVRSELDSYAAQYAKGHHFLLSIAAPAGPDNYNKLKFAELGKVLDYINLMAYDYAGSWSNYTGHDANIYANPQNPNATPYNTDDAVQAYINGGVPANKIVLGMPIYGRSFQQTEGIGKPYNGIGSGSWENGIWDYKALPKAGATVKCDDTAKGCYSYDPSTKELISFDTPAMISTKVSWLKGKGLGGTMFWEASASKKGSDSLISTSHQGLGSQDSTQNYLDYPNSKYDNIKKGMN',
'MILNLIILLAISIVASASNIAAYWGQNAGGDQQTLGDYCSSSPASIIILSFLDGFPNLSLNFANQCSGTFSSGLAHCSQIGSDIKSCQQQGKTILLSLGGATGNYGFSSDSEAVQFAGTLWNKFGGGKDSERPFDDAIVDGFDFDIENKDQTGYAALATQLRKYFSTGTKSYYLSAAPQCPYPDESVGDLMSQVDLDFAFIQFYNNYCSLNQQFNWNSWSNYARGKSIKLYLGLPGSSSSAGSGFVGLSTVQRVVASIKGDSSFGGISIWDISSAENGGYLNQLYQALSGSGSPAAPSNSYQPNTPLTRTYGGSTATASAYISVGFTAGATHGSTTTNDLLAWIDSLFGSSQSSVQQYATPVQSVTATPQPVAATTTSAPKPTASAFNWFGWFDGTTTSTTLQTVYSTVPADQTVYVTLTTTVGSQMLQSLFDKRDVIAEAKSTNLQICWLLFIPLLALICS',
'MAKRTQAILLLLLAISLIMSSSHVDGGGIAIYWGQNGNEGTLTQTCSTRKYSYVNIAFLNKFGNGQTPQINLAGHCNPAAGGCTIVSNGIRSCQIQGIKVMLSLGGGIGSYTLASQADAKNVADYLWNNFLGGKSSSRPLGDAVLDGIDFDIEHGSTLYWDDLARYLSAYSKQGKKVYLTAAPQCPFPDRYLGTALNTGLFDYVWVQFYNNPPCQYSSGNINNIINSWNRWTTSINAGKIFLGLPAAPEAAGSGYVPPDVLISRILPEIKKSPKYGGVMLWSKFYDDKNGYSSSILDSVLFLHSEECMTVL',
'MTKLILLTGLVLILNLQLGSAYQLTCYFTNWAQYRPGLGRFMPDNIDPCLCTHLIYAFAGRQNNEITTIEWNDVTLYQAFNGLKNKNSQLKTLLAIGGWNFGTAPFTAMVSTPENRQTFITSVIKFLRQYEFDGLDFDWEYPGSRGSPPQDKHLFTVLVQEMREAFEQEAKQINKPRLMVTAAVAAGISNIQSGYEIPQLSQYLDYIHVMTYDLHGSWEGYTGENSPLYKYPTDTGSNAYLNVDYVMNYWKDNGAPAEKLIVGFPTYGHNFILSNPSNTGIGAPTSGAGPAGPYAKESGIWAYYEICTFLKNGATQGWDAPQEVPYAYQGNVWVGYDNIKSFDIKAQWLKHNKFGGAMVWAIDLDDFTGTFCNQGKFPLISTLKKALGLQSASCTAPAQPIEPITAAPSGSGNGSGSSSSGGSSGGSGFCAVRANGLYPVANNRNAFWHCVNGVTYQQNCQAGLVFDTSCDCCNWA',
'MKKFINQFSASLKNNILVFLAFPFVWTSCARDNPLSSENSNISPNAAARAAVTGTTKANIKLFSFTEVNDTNPLNNLNFTLKNSGKPLVDMVVLFSANINYDAANDKVFVSNNPNVQHLLTNRAKYLKPLQDKGIKVILSILGNHDRSGIANLSTARAKAFAQELKNTCDLYNLDGVFFDDEYSAYQTPPPSGFVTPSNNAAARLAYETKQAMPNKLVTVYVYSRTSSFPTAVDGVNAGSYVDYAIHDYGGSYDLATNYPGLAKSGMVMSSQEFNQGRYATAQALRNIVTKGYGGHMIFAMDPNRSNFTSGQLPALKLIAKELYGDELVYSNTPYSKDW',
'MKLNIFTKSMIGMGLVCSALPALAMEAWNNQQGGNKYQVIFDGKIYENAWWVSSTNCPGKAKANDATNPWRLKRTATAAEISQFGNTLSCEKSGSSSSSNSNTPASNTPANGGSATPAQGTVPSNSSVVAWNKQQGGQTWYVVFNGAVYKNAWWVASSNCPGDAKSNDASNPWRYVRAATATEISETSNPQSCTSAPQPSPDVKPAPDVKPAPDVQPAPADKSNDNYAVVAWKGQEGSSTWYVIYNGGIYKNAWWVGAANCPGDAKENDASNPWRYVRAATATEISQYGNPGSCSVKPDNNGGAVTPVDPTPETPVTPTPDNSEPSTPADSVNDYSLQAWSGQEGSEIYHVIFNGNVYKNAWWVGSKDCPRGTSAENSNNPWRLERTATAAELSQYGNPTTCEIDNGGVIVADGFQASKAYSADSIVDYNDAHYKTSVDQDAWGFVPGGDNPWKKYEPAKAWSASTVYVKGDRVVVDGQAYEALFWTQSDNPALVANQNATGSNSRPWKPLGKAQSYSNEELNNAPQFNPETLYASDTLIRFNGVNYISQSKVQKVSPSDSNPWRVFVDWTGTKERVGTPKKAWPKHVYAPYVDFTLNTIPDLAALAKNHNVNHFTLAFVVSKDANTCLPTWGTAYGMQNYAQYSKIKALREAGGDVMLSIGGANNAPLAASCKNVDDLMQHYYDIVDNLNLKVLDFDIEGTWVADQASIERRNLAVKKVQDKWKSEGKDIAIWYTLPILPTGLTPEGMNVLSDAKAKGVELAGVNVMTMDYGNAICQSANTEGQNIHGKCATSAIANLHSQLKGLHPNKSDAEIDAMMGTTPMVGVNDVQGEVFYLSDARLVMQDAQKRNLGMVGIWSIARDLPGGTNLSPEFHGLTKEQAPKYAFSEIFAPFTKQ',
'MSTPRAAASLAKKAALVALAVLAAALATAARAEQCGAQAGGARCPNCLCCSRWGWCGTTSDFCGDGCQSQCSGCGPTPTPTPPSPSDGVGSIVPRDLFERLLLHRNDGACPARGFYTYEAFLAAAAAFPAFGGTGNTETRKREVAAFLGQTSHETTGGWPTAPDGPFSWGYCFKQEQNPPSDYCQPSPEWPCAPGRKYYGRGPIQLSFNFNYGPAGRAIGVDLLSNPDLVATDATVSFKTALWFWMTPQGNKPSSHDVITGRWAPSPADAAAGRAPGYGVITNIVNGGLECGHGPDDRVANRIGFYQRYCGAFGIGTGGNLDCYNQRPFNSGSSVGLAEQ',
'MPPQKENHRTLNKMKTNLFLFLIFSLLLSLSSAEQCGRQAGGALCPNGLCCSEFGWCGNTEPYCKQPGCQSQCTPGGTPPGPTGDLSGIISSSQFDDMLKHRNDAACPARGFYTYNAFITAAKSFPGFGTTGDTATRKKEVAAFFGQTSHETTGGWATAPDGPYSWGYCFKQEQNPASDYCEPSATWPCASGKRYYGRGPMQLSWNYNYGLCGRAIGVDLLNNPDLVANDAVIAFKAAIWFWMTAQPPKPSCHAVIAGQWQPSDADRAAGRLPGYGVITNIINGGLECGRGQDGRVADRIGFYQRYCNIFGVNPGGNLDCYNQRSFVNGLLEAAI',
'MRLCKFTALSSLLFSLLLLSASAEQCGSQAGGARCPSGLCCSKFGWCGNTNDYCGPGNCQSQCPGGPTPTPPTPPGGGDLGSIISSSMFDQMLKHRNDNACQGKGFYSYNAFINAARSFPGFGTSGDTTARKREIAAFFAQTSHETTGGWATAPDGPYAWGYCWLREQGSPGDYCTPSGQWPCAPGRKYFGRGPIQISHNYNYGPCGRAIGVDLLNNPDLVATDPVISFKSALWFWMTPQSPKPSCHDVIIGRWQPSAGDRAANRLPGFGVITNIINGGLECGRGTDSRVQDRIGFYRRYCSILGVSPGDNLDCGNQRSFGNGLLVDTM',
'MRSLAVVVAVVATVAMAIGTARGSVSSIVSRAQFDRMLLHRNDGACQAKGFYTYDAFVAAAAAFPGFGTTGSADAQKREVAAFLAQTSHETTGGWATAPDGAFAWGYCFKQERGASSDYCTPSAQWPCAPGKRYYGRGPIQLSHNYNYGPAGRAIGVDLLANPDLVATDATVGFKTAIWFWMTAQPPKPSSHAVIAGQWSPSGADRAAGRVPGFGVITNIINGGIECGHGQDSRVADRIGFYKRYCDILGVGYGNNLDCYSQRPFA',
'MGAFALFAVLAMAVTMAVAEQCGSQAGGATCPNCLCCSRFGWCGSTSDYCGDGCQSQCAGCGGGGTPVTPTPTPSGGGGVSSIVSRALFDRMLLHRNDGACQAKGFYTYDAFVAAAGAFPGFGTTGSTDTRKREVAAFLAQTSHETTGGWATAPDGAFAWGYCFKQERGATSNYCTPSAQWPCAPGKSYYGRGPIQLSHNYNYGPAGRAIGVDLLRNPDLVATDPTVSFKTAMWFWMTAQAPKPSSHAVITGQWSPSGTDRAAGRVPGFGVITNIVNGGIECGHGQDSRVADRIGFYKRYCDILRVGYGNNLDCYNQRPFA',
'MRLSEFTTLFLLFSVLLLSASAEQCGSQAGGALCASGLCCSKFGWCGNTNEYCGPGNCQSQCPGGPGPSGDLGGVISNSMFDQMLNHRNDNACQGKNNFYSYNAFVTAAGSFPGFGTTGDITARKREIAAFLAQTSHETTGGWPTAPDGPYAWGYCFLREQGSPGDYCTPSSQWPCAPGRKYFGRGPIQISHNYNYGPCGRAIGVDLLNNPDLVATDPVISFKSAIWFWMTPQSPKPSCHDVITGRWQPSGADQAANRVPGFGVITNIINGGLECGHGSDSRVQDRIGFYRRYCGILGVSPGENLDCGNQRSFGNGLLVDIM',
'QNCQCDTTIYCCSQHGYCGNSYDYCGPGCQAGPCWDPCEGDGTLTVSDIVTQEFWDGIASQAAANCPGKSFYTRSNFLEAVSAYPGFGTKCTDEDRKREIAAYFAHVTHETGHLCYIEERDGHANNYCQESQQYPCNPNKEYFGRGPMQLSWNYNYIDAGKELHFDGLNDPDIVGRDPIISFKTSLWFWIRKGVQYVILDPNQGFGATIRIINGGQECDGHNTAQMMARVGYYQEYCAQLGVSPGNNLPC',
'MKKNRMMMMIWSVGVVWMLLLVGGSYGEQCGRQAGGALCPGGNCCSQFGWCGSTTDYCGPGCQSQCGGPSPAPTDLSALISRSTFDQMLKHRNDGACPAKGFYTYDAFIAAAKAYPSFGNTGDTATRKREIAAFLGQTSHETTGGWATAPDGPYAWGYCFVRERNPSTYCSATPQFPCAPGQQYYGRGPIQISWNYNYGQCGRAIGVDLLNKPDLVATDSVISFKSALWFWMTAQSPKPSSHDVITSRWTPSSADVAARRLPGYGTVTNIINGGLECGRGQDSRVQDRIGFFKRYCDLLGVGYGNNLDCYSQTPFGNSLLLSDLVTSQ',
'MRSLLILVLCFLPLAALGKVFGRCELAAAMKRHGLDNYRGYSLGNWVCAAKFESNFNTQATNRNTDGSTDYGILQINSRWWCNDGRTPGSRNLCNIPCSALLSSDITASVNCAKKIVSDGNGMNAWVAWRNRCKGTDVQAWIRGCRL',
'MKALIVLGLVLLSVTVQGKVFERCELARTLKRLGMDGYRGISLANWMCLAKWESGYNTRATNYNAGDRSTDYGIFQINSRYWCNDGKTPGAVNACHLSCSALLQDNIADAVACAKRVVRDPQGIRAWVAWRNRCQNRDVRQYVQGCGV',
'MKAFIVLVALACAAPAFGRTMDRCSLAREMSNLGVPRDQLNKWACIAEHESSYRTGVVGPENYNGSNDYGIFQINDYYWCAPPSGRFSYNECGLSCNALLTDDITHSVRCAQKVLSQQGWSAWSTWHYCSGWLPSIDDCF',
'KIFSKCELARKLKSMGMDGFHGYSLANWVCMAEYESNFNTQAFNGRNSNGSSDYGIFQLNSKWWCKSNSHSSANACNIMCSKFLDDNIDDDIACAKRVVKDPNGMSAWVAWVKHCKGKDLSKYLASCNL',
'MTKYVILLAVLAFALHCDAKRFTRCGLVQELRRLGFDETLMSNWVCLVENESGRFTDKIGKVNKNGSRDYGLFQINDKYWCSKGTTPGKDCNVTCNQLLTDDISVAATCAKKIYKRHKFDAWYGWKNHCQHGLPDISDC',
'KVYDRCEFARILKKSGMDGYRGVSLANWVCLAKWESDFNTKAINRNVGSTDYGIFQINSRYWCNDGKTPKAVNACHISCKVLLDDDLSQDIECAKRVVRDPQGIKAWVAWRTHCQNKDVSQYIRGCKL',
'MKAVIILGLVLLSVTVQGKIFERCELARTLKRLGLDGYRGISLANWVCLAKWESDYNTQATNYNPGDQSTDYGIFQINSHYWCNNGKTPGAVNACRISCNALLQDNIADAVTCAKRVVRDPQGIRAWVAWRNHCQNRDVSQYVQGCGV',
'KIYEQCEAAREMKRLGLDGYDGYSLGDWVCTAKHESNFNTGATNYNRGDQSTDYGIFQINSRWWCNDGKTPNAKNACGIECSELLKADITAAVICAKRVVRDPNGMGAWVAWTKYCKGKDVSQWIKGCKL',
'MSALWLLLGLLALMDLSESSNWGCYGNIQSLDTPGASCGIGRRHGLNYCGVRASERLAEIDMPYLLKYQPMMQTIGQKYCMDPAVIAGVLSRKSPGDKILVNMGDRTSMVQDPGSQAPTSWISESQVSQTTEVLTTRIKEIQRRFPTWTPDQYLRGGLCAYSGGAGYVRSSQDLSCDFCNDVLARAKYLKRHGF',
'RTDCYGNVNRIDTTGASCKTAKPEGLSYCGVSASKKIAERDLQAMDRYKTIIKKVGEKLCVEPAVIAGIISRESHAGKVLKNGWGDRGNGFGLMQVDKRSHKPQGTWNGEVHITQGTTILINFIKTIQKKFPSWTKDQQLKGGISAYNAGAGNVRSYARMDIGTTHDDYANDVVARAQYYKQHGY',
'MVPSVVFWGLIALVGTAKGSYTHSVHSMNPHVHPRLYHGCYGDIMTMETFGAPCDINNLMNCGIHGSEMFAEMDLKAIKPYRILIKEVGQRHCIDPALIAAIISRESHGGAVLQNGWDHKGQRFGLMQLDKNMYHPIGSWDSKEHLLQSVGILTERIKAMKRKFPTWNTAQQLKGGLTAFKSGMETIVTPADIDGDLVDDVLARAKFYKRHGF',
'MGYGNIMNVETTGASWQTAQQDKLGYSGVRASHTMANTDSGRMERYRSKINSVGAKYGIDPALIAAIISEESRAGNVLHDGWGDYDSNRGAYNAWGLMQVDVNPNGGGHTARGAWDSEEHLSQGAEILVYFIGRIRNKFPGWNTEQQLKGGIAAYNMGDGNVHSYDNVDGRTTGGDYSNDVVARAQWYKTQKGF',
'MPYGKIEDIKTSGASDVTAAQDGLKEGGWKSSHRMAEIDSNRMENYRTIINEAGRQCDVDPAVIAGIISRESRAGNQLINGWGDHGKAFGLMQIDVTPPPNGGGHTPVGTWDSLEHLIQATEILVEFIERIKTKFPRWNADQHLKGALAAYNKGEKNVESYASVDAKTTGKDYSNDVVARAQWYKSNMGF',
'MKCLVALFLSLSLVACQYDDYDTERKNNNMLSSMNILDLLDSFGLNIKARIAHVRRVAGRIRLTLDIGLGNGDVERESEEAEGEGTDGRGGGEGEREGWGGEREGGEGEREGGEGEREGREGEREGKSSESNESPEDFIGPPVDMCAGESRRGSPSIGCIAAECCQHSFYINSLCPGSSVCCFSMDVCDRLPVPVIPPFPTDPGTLPPPPPIPDSQTTVSPNQPSSYMCHGDFMKLMPKGADQRTARQDNLAYAGVRASNKLVDNDLAELNKRKDCYVQAGKNHCIHPAVIAAIASRETRGGKLLYSTNGYGDGGRAYGIMQCDGGASGLGDICKKYPWDSCEHINQLTDIILLNYVNQMKTKHPSWPAHYQLKGGVSAYNAGVGNVQTIAGMDAGTTNDDYSNDVIARAQRLVNAHGW',
'MLGKNDPMCLVLVLLGLTALLGICQGGTGCYGSVSRIDTTGASCRTAKPEGLSYCGVRASRTIAERDLGSMNKYKVLIKRVGEALCIEPAVIAGIISRESHAGKILKNGWGDRGNGFGLMQVDKRYHKIEGTWNGEAHIRQGTRILIDMVKKIQRKFPRWTRDQQLKGGISAYNAGVGNVRSYERMDIGTLHDDYSNDVVARAQYFKQHGY',
'MHLMLVLLGLAALLGTSQSRTGCYGDVNRVDTTGASCKSAKPEKLNYCGVAASRKIAERDLQSMDRYKALIKKVGQKLCVDPAVIAGIISRESHAGKALRNGWGDNGNGFGLMQVDRRSHKPVGEWNGERHLMQGTEILISMIKAIQKKFPRWTKEQQLKGGISAYNAGPGNVRSYERMDIGTTHDDYANDVVARAQYYKQHGY',
'MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKSELDKAIGRNCNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRCALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL',
'MEMISNNLNWFVGVVEDRMDPLKLGRVRVRVVGLHPPQRAQGDVMGIPTEKLPWMSVIQPITSAAMSGIGGSVTGPVEGTRVYGHFLDKWKTNGIVLGTYGGIVREKPNRLEGFSDPTGQYPRRLGNDTNVLNQGGEVGYDSSSNVIQDSNLDTAINPDDRPLSEIPTDDNPNMSMAEMLRRDEGLRLKVYWDTEGYPTIGIGHLIMKQPVRDMAQINKVLSKQVGREITGNPGSITMEEATTLFERDLADMQRDIKSHSKVGPVWQAVNRSRQMALENMAFQMGVGGVAKFNTMLTAMLAGDWEKAYKAGRDSLWYQQTKGRASRVTMIILTGNLESYGVEVKTPARSLSAMAATVAKSSDPADPPIPNDSRILFKEPVSSYKGEYPYVHTMETESGHIQEFDDTPGQERYRLVHPTGTYEEVSPSGRRTRKTVDNLYDITNADGNFLVAGDKKTNVGGSEIYYNMDNRLHQIDGSNTIFVRGDETKTVEGNGTILVKGNVTIIVEGNADITVKGDATTLVEGNQTNTVNGNLSWKVAGTVDWDVGGDWTEKMASMSSISSGQYTIDGSRIDIG',
'MPPSLRKAVAAAIGGGAIAIASVLITGPSGNDGLEGVSYIPYKDIVGVWTVCHGHTGKDIMLGKTYTKAECKALLNKDLATVARQINPYIKVDIPETTRGALYSFVYNVGAGNFRTSTLLRKINQGDIKGACDQLRRWTYAGGKQWKGLMTRREIEREVCLWGQQ',
'MVEINNQRKAFLDMLAWSEGTDNGRQKTRNHGYDVIVGGELFTDYSDHPRKLVTLNPKLKSTGAGRYQLLSRWWDAYRKQLGLKDFSPKSQDAVALQQIKERGALPMIDRGDIRQAIDRCSNIWASLPGAGYGQFEHKADSLIAKFKEAGGTVREIDV',
'MKGKTAAGGGAICAIAVMITIVMGNGNVRTNQAGLELIGNAEGCRRDPYMCPAGVWTDGIGNTHGVTPGVRKTDQQIAADWEKNILIAERCINQHFRGKDMPDNAFSAMTSAAFNMGCNSLRTYYSKARGMRVETSIHKWAQKGEWVNMCNHLPDFVNSNGVPLRGLKIRREKERQLCLTGLVNE',
'MMQISSNGITRLKREEGERLKAYSDSRGIPTIGVGHTGKVDGNSVASGMTITAEKSSELLKEDLQWVEDAISSLVRVPLNQNQYDALCSLIFNIGKSAFAGSTVLRQLNLKNYQAAADAFLLWKKAGKDPDILLPRRRRERALFLS',
'MQISQAGINLIKSFEGLQLKAYKAVPTEKHYTIGYGHYGSDVSPRQVITAKQAEDMLRDDVQAFVDGVNKALKVSVTQNQFDALVSFAYNVGLGAFRSSSLLEYLNEGRTALAAAEFPKWNKSGGKVYQGLINRRAQEQALFNSGTPKNVSRGTSSTKTTPKYKVKSGDNLTKIAKKHNTTVATLLKLNPSIKDPNMIRVGQTINVTGSGGKTHKVKSGDTLSKIAVDNKTTVSRLMSLNPEITNPNHIKVGQTIRLS',
'MKVSQNGLNLIKEFEGCRLTAYKPVPWEQMYTIGWGHYGVTAGTTWTQAQADSQLEIDINNKYAPMVDAYVKGKANQNEFDALVSLAYNCGNVFVADGWAPFSHAYCASMIPKYRNAGGQVLQGLVRRRQAELNLFNKPVSSNSNQNNQTGGMIKMYLIIGLDNSGKAKHWYVSDGVSVRHVRTIRMLENYQNKWAKLNLPVDTMFIAEIEAEFGRKIDMASGEVK',
'MVKKNDLFVDVSSHNGYDITGILEQMGTTNTIIKISESTTYLNPCLSAQVEQSNPIGFYHFARFGGDVAEAEREAQFFLDNVPMQVKYLVLDYEDDPSGDAQANTNACLRFMQMIADAGYKPIYYSYKPFTHDNVDYQQILAQFPNSLWIAGYGLNDGTANFEYFPSMDGIRWWQYSSNPFDKNIVLLDDEEDDKPKTAGTWKQDSKGWWFRRNNGSFPYNKWEKIGGVWYYFDSKGYCLTSEWLKDNEKWYYLKDNGAMATGWVLVGSEWYYMDDSGAMVTGWVKYKNNWYYMTNERGNMVSNEFIKSGKGWYFMNTNGELADNPSFTKEPDGLITVA',
'TVQGFDISSYQPSVNFAGAYSAGARFVIIKATEGTSYTNPSFSSQYNGATTATGNYFIRGGYHFAHPGETTGAAQADYFIAHGGGWSGDGITLPGMLDLESEGSNPACWGLSAASMVAWIKAFSDRYHAVTGRYPMLYTNPSWWSSCTGNSNAFVNTNPLVLANRYASAPGTIPGGWPYQTIWQNSDAYAYGGSNNFINGSIDNLKKLATG',
'MKGIDIYSGQGSVDFNAVKESGVEVVYIKATEGLTYTDSTYKDFYDGAKNAGLKIGFYHYLRANDPTSEAEHFFNTISGLSLDCKCAIDVEVTLGQSIDQISSNVRKFADYLINKGLDVCVYTYTNFYKDNLNSTVKDLPLWIAEYGVSKPNIDASYVGFQYSDSGSVNGISGSADLDEFSEGILVGGTVVIDPGQGGDDNIKAIQQDLNILLKRGLEVDGIEGPETEAAIKDFQSIMGLTVDGIWGTNTSGAAQQIFSRPLDGVAYPHYEYATRYIQYRVGASVDGTFGSGTKAKVAAWQSNQGLMADGVVGSATWSKLLDEN',
'KLGIDVSQPTSTSSFTCLRNKGFTTMVIVRAWKSTGSFDTNAPQTLKNANAAGFSIENSDVYYYPCISCGNMAGQVRTFWQKVGQYSLKVKRVWFDIEGTWTSSVSTNQNYLMQMMNEARAIGIVHGIYGSKYYWGNLFGSSYKYRYRSSTPLWYPHYDNSPSFSDFSSFGGWTSPSMKQYRGDVSVCSAGVDYNYKP',
'MPAYSSLARRGRRPAVVLLGGLVSASLALTLAPTAAAAPLAPPPGKDVGPGEAYMGVGTRIEQGLGAGPDERTIGPADTSGVQGIDVSHWQGSINWSSVKSAGMSFAYIKATEGTNYKDDRFSANYTNAYNAGIIRGAYHFARPNASSGTAQADYFASNGGGWSRDNRTLPGVLDIEHNPSGAMCYGLSTTQMRTWINDFHARYKARTTRDVVIYTTASWWNTCTGSWNGMAAKSPFWVAHWGVSAPTVPSGFPTWTFWQYSATGRVGGVSGDVDRNKFNGSAARLLALANNTA',
'MTKTYGVDVAVYQPIDLAAYHKAGASFAIVKLTEGVDYVNRRGPSRWTAPGLTTSTLMPTISRSFGSSVSRAKKEAAYFLKEAKKQDISKKRMLWLDWEAGSGNVVTGSKSSNTAAILDFMDAIKAAGWRPGLYSGASLMRTAIDTKQVVKKYGTCLWVASYPTMAAVSTADFGYFRQWTGSPSGSLPVTAWPGRRRERCSG',
'MQLRITSRKKLTSLLCALGLISIVAIYPRQTVNFFYSTAVQITDYIHFYGYRPVKSFAIRIPASYTIHGIDVSRWQERIDWQRVAKMRDNGIRLQFAFIKATEGEKLVDPYFSRNWQLSRENGLLRGAYHYFSPSVSASVQARLFLQTVDFSQGDFPAVLDVEERGKLSAKELRKRVSQWLKMVEKSTGKKPIIYSGAVFYHTNLAGYFNEYPWWVAHYYQRRPDNDGMAWRFWQHSDRGQVDGINGPVDFNVFNGTVEELQAFVDGIKETP',
'MRFIALLISFFALLKVISAISGVDISSASTIESFTCLKSAGYDFAIIRAYESLGQVDPNGPHSVYNARDAGIEYVDVYMFPCPTCGNGAGQAETMVNYLKGYNANYGMVWLDIEGPQYWMSQSENVAFFESLVAGLKAEGAHIGVYTSASQWEPIMGGYTGGSEFPLWYAHYDGNPSFSDFSPFNGWSTPSVKQYDDTGDSCGLGFDLNWYP',
'MHCAPSWKSSDERRTMLDQINTLDPNSLTALKRMSKDNSPAAIKGAAQQFEALFLQNMLKSMRDATVTSDAMGSETTRFYQGLYDQQLAAMMAQRGGIGLADVMEKQMGAQAASAQNAAAAGASSAGNVPLSLDAARAAAAHTASGDKVPTTPQAFVDATWPQAAKAAQSLGVPAHFLVAQAALETGWGKSQIRNKDGTPSYNLFNIKAGSNWTGKVVEARTVEYENGQRKVRVERFRAYDSYEQAFQDYADLVGNSPRYAKVAGKTDGHAFARALQEGGYATDPSYADKLARVINGNALRQRLMASAASARG',
'MINKKWMKIVMIPMLVVPMYGLTSVSGQIQDSLTGENSFVKDAEAATTASQQAFIDKIAPAAQASQEQYHLLSSITLAQAILESGWGKSGLATKGYNLFGIKGKYNGQSVIMSTSEYVNGQWIKIDAEFRKYPSWNESVTDHTLLLVNGTSWNKNLYKKVVDATDYKVAAMELQKAGYASPTYGASLIQVIENYDLAKYDVLYDKILTQKSTSGKATVTSPTGNGVWTLPYKVKGVQSVSPASTYANKDIDLVSVATTKRGTYYQFKYNGKVVGWVDAKALTIYDSVNYDKVNVGRAKITSPVSNGIWSKPYNVYGREFVTNATTYAQQEIKLLREAQTAKGTYYQFSINNKTIGWIDKRALTIYPYDSIVSSKNVSLDGQITNPTGNGIWTKAYKLEGTTSVAQATKYANKDVKISQQVETQHGTYYNISIDGKAIGWLDKNAITLYDQAEYNKTVAFDAAIRNVQGNAVWTEPYRTVGTKLIGPAETYLNKEVEVVREAKTPKGTYYQFKSGGKVIGWLDKKAFEVYDNINYNKAVNLDAVVENVTGNAVWTAPYKSKGVKLVTSAATYKGKATKITREAQTSRGTYYEFSVNGKVIGWLDKKAFDVYDSIEYNKAINMTGLLSNAPGNGIWTEPYRVLDTKNIGQATAYANKTVQLVREAKTSHSTYYQMSLNGKVIGWIDKRAFTNVK',
'MVNTQVKRVKKQKFIAGTALLLGMATFGMVGKADDLSSSNTNGGVDNSKVDNDNQESVKTSTEGVSSTTENANTVPESKVTSTVDSESAPSKTISAGTQSNISGTSDGSDSLPKTETSDSSSKPSTSNSSSKPSTSNSSSKPSTSNSSSNNNSATKPSTTTQAPPVAPSTTAPSATPSTTAPSNYYQNSSYNQTSTAAQIPNSSSDSAASVYSGPVLKKIEAAKPIEKIDSSSTEAFIKSIADRVRILAGKNNLYASIILAQAILESGSGQSNMTQQYFNIFNITGAYLGKSISFKTEEFSGNNPYYIEQSFRVYSNYDQALDDYINLMIKGTTWNSEIYAGAWKSHAKTYQEAAQALQGIFATDPEYAQKLIEIIEEYNLNFYDNVDSTTQVLDSNIPESPLVASKLDSSTYPDYNGVEYPGADSYAFGNCTQYVYNRIIQLGGQIGTHMGNGGEWGINAQAQGYFTTTVPTEGYAVSFPPGVAGSSPEYGHVAFVEKVYPDNSILVSEMNVKGNNIVSERHISAGVAALATYIQPK',
'MNRNRLSCLIVGAVIGAGAIVCTTNTKVHAKPVNEVKNINTSKGNSFGEIISSEDIGLRKGADSSHEIITSIPSGARVNIIDKMSKDWYKVSYKDFTGYLQAKDIRVLGDELNQDNVGLISANQLNVRTSPNENGQVIGTLHKNDKVNVLDKSIDGWYKIDFNGRRAYVSSKYVNLISYKNNEVKTEVKKEPIEGTGKVNINTALNVRQASTTNSRIIGSLKGGEKVNIISESNGFYKIEFNNSYGYVYSKYISKDGDSEKVQVVKQEEVKKEKVDESKKEAKATPKAEPVVLAVRSLNKTGIVNVSSSLNVREGAGTSSKVIGSLSGNTKVTIVGEEGAFYKIEYKGSHGYVAKEYVKDVTESSNSNQGTQTPEKPSTPESTEKTGIVNVSSSLNVREGASTSSKVIGSLSGNTKVIIVGEEGAFYKIEYKGSHGYVAKEYIKDVTESNNSNQGTQTPEKPSTPESTEKTGIVNVSSSLNVREGASTSSKVIGSLSGNTKVTIVGEEGAFYKIEYKGSHGYVAKEYIKDIKDEVVTEPEKPSAPENTEKTGVVNVSSSLNVREGASTSSKVIGSLSGNTKVIIVGEEGAFYKIEYKGSHGYVAKEYIKDVTESNNSNQGTQTPEKPSTPESTEKTGIVNVSSSLNVREGASTSSKVIGSLSGNTKVTIVGEEGAFYKIEYKGSHGYVAKEYVKDVTESNNSNQGTQTPEKPSTPESAEKTGVVNVSSSLNVREGASTSSKVIGSLSGNTKITIVGEEGAFYKIEYKGSHGYVAKEYIKDIKDEVVTEPEKPSTHENSKKTGVVTASKGLNVRKEANTSSQIIGILNSGESVEIIGEENGFYKITYKGQEAYASKNYINIFDGNSNVNPGLDIGNASKTNYGVSLNEYIKLQQRNNPSNYSYSEFEKYINPAKATNKLQFLRIDKFRSVNVSGLSSRLSNKGVLTGQGQAFVNAAKAFNIDPIYLVAQCLHETGNGTSKLAKGVTITEIADESKPIYNGNGQLVGYHMIKLSKPVTVYNLFGIGAKDNSSVFPNRALILGTTYAYNRGWTSIENAIKGAAEFVSLNYVHSSRYSQNTLYKMRYNQNVSNIWHQYATTPWYASSIADIMRSYQDLYLENNFTFDVPVFAG',
'MKKESMSRIERRKAQQRKKTPVQWKKSTTLFSSALIVSSVGTPVALLPVTAEATEEQPTNAEVAQAPTTETGLVETPTTETTPGTTEQPTTDSSTTTESTTESSKETPTTPSTEQPTADSTTPVESGTTDSSVAEITPVAPSATESEAAPAVTPDDEVKVPEARVASAQTFSALSPTQSPSEFIAELARCAQPIAQANDLYASVMMAQAIVESGWGASTLSKAPNYNLFGIKGSYNGQSVYMDTWEYLNGKWLVKKEPFRKYPSYMESFQDNAHVLKTTSFQAGVYYYAGAWKSNTSSYRDATAWLTGRYATDPSYNAKLNNVITAYNLTQYDTPSSGGNTGGGTVNPGTGGSNNQSGTNTYYTVKSGDTLNKIAAQYGVSVANLRSWNGISGDLIFVGQKLIVKKGASGNTGGSGSGGSNNNQSGTNTYYTVKSGDTLNKIAAQYGVSVANLRSWNGISGDLIFVGQKLIVKKGASGNTGGSNNGGSNNNQSGTNTYYTIKSGDTLNKIAAQYGVSVANLRSWNGISGDLIFAGQKIIVKKGTSGNTGGSSNGGSNNNQSGTNTYYTIKSGDTLNKISAQFGVSVANLQAWNNISGSLIFAGQKIIVKKGANSGSTNTNKPTNNGGGATTSYTIKSGDTLNKISAQFGVSVANLRSWNGIKGDLIFAGQTIIVKKGASAGGNASSTNSASGKRHTVKSGDSLWGLSMQYGISIQKIKQLNGLSGDTIYIGQTLKVG',
'MKKRLIAPMLLSAASLAFFAMSGSAQAAAYTDYSLYKVEPSNTFSTESQASQAVAKLEKDTGWDASYQASGTTTTYQISASGIHSESEAKAILSGLAKQTSITGTSSPVGSKQPYVTISSGAISGEKQANTILAKLKQETGVAGAVKAYGAAQPYMNVMTSDIADETKVKALIQSLAKQTGIKSSYQPITHTVSVTTIQSGTIVGDSRAAQIKNAFQKESGLQASLKETVKGQAYYTFTTAAISGEANAKTLLQQLKQSTGITGSYKSINQKTTVESYNVQSAYFKGLSTVKDAISQIKKNTGVSGSYQQVGKSTSYTVNMKGITKQQLQKIDTFFKKKKWHYTSSSVKKTTTSAAYQITTAKILGEQQANKAAAFFAQKKVKAAKTAAGSTAENQYQLISEETSDQAKVTKGLNILKKNQLSASAKSVKKQIADTFKITTESLLDQTKVNQALTFFKSNHISVASQKTGQTAASSYQITTEAIISQEEIDRVLTFFKQNHIAVTTSKTGQTAYTQYKIVTTQLSSKTALNNGLTYLKSKSVTPSYTTKSNTLYKISVNEQFTGNDTAAAASTKLKQLYGWTSSIVKIKNGPQIMKTNYNLSLRDMVQKQMTVSPQTDGAAYVSLTYINTATSTVTADVLNIRSTPEVSPTNVIGQFKKGDKVKVIGQINGWAKINLGWRNASSDEVVQYVDPNNFSRDSKYYFQFLKLSQTAGLSVTEVNQKVLAGKGILTGRAKAFIDAANQYSINELYLISHALLETGNGTSALANGLTYNGKTVYNMYGIGAYDSNPNYYGAKYAYEQGWFTPEAAIIGGAKFIGSSYIHNTAYNQDTLYKMRWSATATHQYATDIGWAYKQVNRMYSLYSLLDGYTLYFDVPEYR',
'MARKKLKKRKLLISLFFLVSIPLALFVLATTLSKPIEISKETEEIDEQQVFIDSLSGHAQILYEKYHVLPSITIAQAILESDWGNSELAAKANNLFGVKGNYKGHHVTMETDEVEKGKRKTIRAKFRKYSTFFESMDDHAQLFVRGTSWNKKKYKPVLEAGNYKEAATALQTSGYATDPDYADKISAIVEKYDLDEYDEVNPSLKSVDLNASIKDSAVQDVWSKPSTDDRSIRLTSAQSYVGKDIKVVSKKQKGQSVWYQFQINDKLIGWIDDSAVEIKEAT',
'MARKLIKNLGKSKSVKRVKLLFKKIFITVFIVASIVAIFNITKYFEELYKVRDLKSTKIEYYMDVADEAGDGKVQLSWKALLAIDMVIHDEDLSNIKKKDTLDIGEKFIVEDKNDKGEKVYKVKKFNKVLSELKFDSSQKSRARKYMKDLEYTYLGNKQLDSSDEKIKFIKKLEDSAIREYIDYGILPSITIGQAILESGWGNSKLTKQSNNLFGIKADKAWKGKSVEISTSEHYNEKIVASFRSYNSLQDSVKDHSLFLINNKRYRKHGLFEAKDYISQAQALENAGYSTAEDKKGNRIYAELLIDVIRSYNLQLIDNKVETK',
'MFFLTLPLLLGCTAATTPLTAATPPVDPLPLKVVSTDQLPKGLAKDQQLWNKVNGQKGDYKALLTAIDHSLEYLGTDKAQKDYQDYKVPGITRDRVSRSLRRFRQLVVQAKSPQALETAVKKEFQFYQSIGNDQKGNVDFTGYYEATYPASRQPTTEFRYPLYQAPADLKAWPKPHPTRAELEGADGLQASQGPLKGLELVWLRDRIQAFLVQVQGSARLGLTDGTEMTVGYAGKTAHPYTSIGKALIADGKFTLEELSLPVVLQYFEENPQDLDLYIPKNKSFVFFQETFGSPPMGNLNVPVTDERSIATDKSLMPPGALALIQTNLPYYNASQTLEFKDVSRFVLDHDTGSAIKGPGRVDIFMGTGAKAKERAGVMTGSGQLYYLLLKDN',
'MNTPFSIDEVSFRDLPGWGQDDPRKLFPAMATILSHLRNAKPYRTGALGITAAELVSLLELAERGQVNSPEQARQFFETNSVPFRISPAQGKSGFVTAFYEPELEVSATPDDVWRYPIYRRPPELVDIDNDNRPDGFDPSYAFGKADEEGISYFPDRRAIDEGCLRGRGLEIAWARSKVDLFFVHVQGAARLVFPDGAIKRITYAAKAGHVFSPIGRLLLDRGELDPKTISMQTIRQWLADHPDEVDGVLWHNRSYIFFREADVAGLDMGPIAAAKVPLVAGRALAVDRLIHTFGLPFFIHAPTLTHLDDGKPFARLMLALDTGSAIVGPARGDIFTGSGFEAGELAGTVRNEADFYILLPRIAAERYRR',
'MRKIQVAVFLFVGLLAACSTVPPSSAPTTCAQCQPCPACPAVTPAITPAPAPAFSRSLLPASWGDLPGWAEDDVTAAWPAFMQSCRGIASRGNAAGWRRVCELARAADGKPENDVRRFFERHLKPYAIVNGDGLVSGLVTGYYEPMLRGSRTKAKGYEQPVRGVPDDLLTIDLSAVFPELKDKRVRGRLEGNKVVPYWSRAEIAARGDKLPGKTLLYVDDAVELFFLQVQGSGRVKLADGGMVRLNYADQNGYQYQSIGKALVERGELKLEEASMQGIQAWARANPARLESLLNTNPSYVFFREVANSADGPVGALGVPLTAERSIAIDPRSVPLGSPVFLATTRPNSAVPLNRLVMAQDTGGAIKGGVRADFFWGFGKEAGDQAGRMKQSGRMWILLPTELAPK',
'MKGRWVKYLLMGTVVAMLAACSSKPTDRGQQYKDGKFTQPFSLVNQPDAVGAPINAGDFAEQINHIRNSSPRLYGNQSNVYNAVQEWLRAGGDTRNMRQFGIDAWQMEGADNYGNVQFTGYYTPVIQARHTRQGEFQYPIYRMPPKRGRLPSRAEIYAGALSDKYILAYSNSLMDNFIMDVQGSGYIDFGDGSPLNFFSYAGKNGHAYRSIGKVLIDRGEVKKEDMSMQAIRHWGETHSEAEVRELLEQNPSFVFFKPQSFAPVKGASAVPLVGRASVASDRSIIPPGTTLLAEVPLLDNNGKFNGQYELRLMVALDVGGAIKGQHFDIYQGIGPEAGHRAGWYNHYGRVWVLKTAPGAGNVFSG',
'MKKYLFRAALCGIAAAILAACQSKSIQTFPQPDTSVINGPDRPVGIPDPAGTTVGGGGAVYTVVPHLSLPHWAAQDFAKSLQSFRLGCANLKNRQGWQDVCAQAFQTPVHSVQAKQFFERYFTPWQVAGNGSLAGTVTGYYEPVLKGDDRRTAQARFPIYGIPDDFISVPLPAGLRSGKALVRIRQTGKNSGTIDNTGGTHTADLSQFPITARTTAIKGRFEGSRFLPYHTRNQINGGALDGKAPILGYAEDPVELFFMHIQGSGRLKTPSGKYIRIGYADKNEHPYVSIGRYMADKGYLKLGQTSMQGIKAYMQQNPQRLAEVLGQNPSYIFFRELTGSSNDGPVGALGTPLMGEYAGAVDRHYITLGAPLFVATAHPVTRKALNRLIMAQDTGSAIKGAVRVDYFWGYGDEAGELAGKQKTTGYVWQLLPNGMKPEYRP',
'MKFPFHPWRRLLLCALPFAALLTACDDGKKEPPPTPAEVTTYNSVPWDALPATSDADLLAGFNAWRSACARLAKDPVWGEPCASATTVAADPTAVRAFLQERMQVYSLRSSSNGDQGLITGYYEPVYHGSLSQGEKTPVPVYGVPDDLVVVALESVYPELKGKRLRGRLEGRVLKPYDDAATIRDNGSSAPVLAWLGDPMDLQFLQIQGSGRIQLEDGRQLRIGYGDQNGHPYKPVGRWLVEQGLVPKEEISMKRIRDWAEANPQRVSELLASNPSFVFFSLRPDSDEGPRGSLNVPLTDGYSVAIDRKVIPLGSLMWLSTTRPDDGSAVVRPVAAQDTGGAIVGEVRADLFWGTGDAAGELAGHMKQPGRLWLLWPKGAPLPAS',
'MGAMNGTSGRRLSTATRVAAMAGVLLLAACGGPSSRPGLVSRPAGVAGPVSYQRVAIEGLPGWSTDRVADALPVFRRSCERLRAVSPNSMVGPSVWGSRASDWQAACAVAARLPAFDDDAARRFFAERFQAWQVTGAGDPTGLFTGYYEAALDGSLSPSAVYSTPIYGVPLDLRMEGGKGMRVSGGRSLPYPDRAAIEEGAISGVAPVIMWARDPVDVFMLHIQGSGQVRLPDGRIQRIGYAANNGHPFVGIGAIMRDRGLGDGSSMIAIRAWLRANPAEGRALMRENPRFIFFRPIEGEGPIGAQGLPLTGGRSLAVDPSSVPLGAPVWLATSDAHGETVNRLMVAQDTGSAIKGAVRGDFFWGSGEEALYHAGGMKSAGRYWVLVPRGGRNAVAQN',
'MKGRWAKYVATGVMLAMLAACSSKPTDRGQQYKDGKFTQPFSLVNQPDAVGAPINAGDFAEQVNQIRSASPRLYTNQSNVYNAVQNWLRSGGDTRTMRQFGIDAWQMEGTDNYGNVQFTGYYTPVVQARHTRQGAFQYPIYSMPPKRGRLPSRAQIYAGALSDKYILAWSNSLMDNFIMDVQGSGYIDFGDGSPLNFFSYAGKNGWPYRSIGKVLIDRGEVKKEDMSMQAIREWGEKHSEAEVRELLEQNPSFVFFKPQSFAPVKGASAVPLIGRASVASDRSIIPPGTTLLAEVPLLDNNGKFSGQYELRLMVALDVGGAIKGQHFDIYQGIGPDAGHRAGWYNHYGRVWVLKSAPGAGNVFSG',
'MFKRRYVTLLPLFVLLAACSSKPKPTETDTTTGTPSGGFLLEPQHNVMQMGGDFANNPNAQQFIDKMVNKHGFDRQQLQEILSQAKRLDSVLRLMDNQAPTTSVKPPSGPNGAWLRYRKKFITPDNVQNGVVFWNQYEDALNRAWQVYGVPPEIIVGIIGVETRWGRVMGKTRILDALATLSFNYPRRAEYFSGELETFLLMARDEQDDPLNLKGSFAGAMGYGQFMPSSYKQYAVDFSGDGHINLWDPVDAIGSVANYFKAHGWVKGDQVAVMANGQAPGLPNGFKTKYSISQLAAAGLTPQQPLGNHQQASLLRLDVGTGYQYWYGLPNFYTITRYNHSTHYAMAVWQLGQAVALARVQ',
'MFALTAYRLRCAAWLLATGIFLLLAGCSEAKAPTALERVQKEGVLRVITRNSPATYFQDRNGETGFEYELAKRFAERLGVELKIETADNLDDLYAQLSREGGPALAAAGLTPGREDDASVRYSHTYLDVTPQIIYRNGQQRPTRPEDLVGKRIMVLKGSSHAEQLAELKKQYPELKYEESDAVEVVDLLRMVDVGDIDLTLVDSNELAMNQVYFPNVRVAFDFGEARGLAWALPGGDDDSLMNEVNAFLDQAKKEGLLQRLKDRYYGHVDVLGYVGAYTFAQHLQQRLPRYESHFKQSGKQLDTDWRLLAAIGYQESLWQPGATSKTGVRGLMMLTNRTAQAMGVSNRLDPKQSIQGGSKYFVQIRSELPESIKEPDRSWFALAAYNIGGAHLEDARKMAEKEGLNPNKWLDVKKMLPRLAQKQWYAKTRYGYARGGETVHFVQNVRRYYDILTWVTQPQMEGSQIAESGLHLPGVNKTRPEEDSGDEKL',
'MIGADTAKECDAMTFKLLPLAVLCAALVGCQSAQSRDARAESPATAESAAPTAEAPVSEAQEADFETWLANFRRQARGEGIDEATLARALDGLRYRPRVIELDGSQPEFVRPIWEYLDSAVSASRVKKGRERLAEYRDTVRQMTERYGVPGEVLVAIWGIESSYGDYLGDFSTLEALATLAYDGRRRDFARGELLAALRIIEAGDISPERMKGSWAGAMGHTQFIPSSFLAHAVDGDGDGRRDIWNSIADVLASTANYLDEAGWREGEPWGTEVSLPQGFDYTLTEPDIRRSSAEWAAAGVRSRDGHALPDFASASVIAPAGAQGPVFLVGHNFRVILRYNNATSYALAVATLSDAIAGRAGIQGEWPREQPALKRSEVREMQQLLDARGFDVGTPDGILGPNTRRGLRAFQREIGVTPDGFATKALLERLRR',
'MPGLPRARMAQWHPLYSVRLAKDTMTDTQRSLRRPLLGAALSAAALGLCGLSPSLLAAGKRRVSLREEEIEPGRYRDNPQARAFIDEMVARHGFDRGMLQDWFGQAVYSATVVRLIMPPATTGRKSWRTYRSRFIEPIRINAGVRFWQDNRDTLRRAEAEFGVPASVIVGIIGVETIYGRDMGSFRVLDSLSTLAFDYPATPNREARSTLFRNQLADYLLWCRDTRTDVYSVLGSYAGAIGIPQFMPTSLREYALDYDNNGHIDLRNSPTDAIGSVARFLQLHGWEPGRPVVWRIAPDDGSLGVATAAADGEPWPTRTLNQLTRAGLRVDEPINLAREGETGVLVVDLPTPDQPTEYLLGLRNFYVLTRYNRSFFYALAVYQLGEAVKAAMG',
'MFGILNRREMLRGTAATLLLPGILTSAHAGQVAEDPLLRYPWLAQWAGADGLDAPWLRGVFQNLKKYPRVIRAMNHQAEAKPFYLYREHVTSPWLYKKGREAWQQHRAMLEAAGARYGVDAPFVLALWGMESRFGRNQGEHPVLRTLFTLAVDYPRRQTFFRQELRHFLILCRQQGWDPMLLKGSYAGAMGHVQMIPSSLRYYAVDGDGDGRLDVFNNPMDATASIAHYLGKHGWELGGPYLIPVYGITDLSAIKSAKVKEMQPWSSWYALGVRTRGEPPPAERAMALIALEEQDGLRYYGVFNNFRVILDWNRSTRFAKVVGELAEGFVL',
'MPTPATRASLIGLALASGLLAGPARADFQSCLAGIQAQAAGAGVSAQTFRAATANIAYDDKVIELSQAQPEFKTPIWDYMSALVDEERVEDGRAAMRQHAQALANAEARYGVDRHTIAAVWGVESNFGKNLGKMPLVQSLATLACSSNRRRDFFRSELIATLKIIERGDIEASRLTGSWAGAFGQTQFMPTTYQRLAVDGDGDGRRDVVDSVADAVASTANFLRVAKWSNGQPWGYEVRLPRGFNVAAAGRKNKHAVGHWASLGVTRVDGKALTGDGPAGIIAPAGINGPAFLVTKNFDAIYSYNAAESYGLAIAVLSDRLRGRPGVQADWPTDDPPLSRAERRDLQTRLTARGYDVGEPDGKVGSKTREAIKEIERQLGMPATGRPGGKVLEALRRG',
'MFKYSFIAVIVSTVLLSACADSHQKSAEKKPVTSEIANIATSAPARWKQIDVVSLEQAFPKQSRTPAQFPAYVDALKQKAAELGYKPETINFAFSEIHFIDRVVKSDRNQPEKKITLDVYLPRVVTKGRIAEGAKLYQANQQTLAQISNQYGVPANYIVALWGLESGFGRVQGKEDVISALATLAFEGRREALFSRQLMAALEIIENGHLPVGQRLKGSWAGAMGQTQFMPSSFLTYAADGNGDGNIDIWNSREDAFASAANYLATEGWQRDLPWGEQVSLPANFNQQLEGIKTEQQKTVAQWKALGVQLPANSQLSDDMKVWLIIPDDDLHRSYLVTQNFRTIMHWNSSYFFALSIVTMADGVANKINTLPTQH',
'MKKESRPAFDAAAVFDAAAVPVSDSGFAANANVRRFVDDEVGKGDFSRAEWQDFFDKAAYKADIVKIMHRPSTSRPWYVFRTGNSGKAKFRGARRFYAENRALIDDVAQKYGVPAELIVAVIGIETNYGKNTGSFRVADALATLGFDYPRRAGFFQKELVELLKLAKEEGGDVFAFKGSYAGAMGMPQFMPSSYRKWAVDYDGDGHRDIWGNIGDVAASVANYMKQHGWRTGGKILVSATLAPGADVQAIIGEKTALTRTVADLKAYGIIPGEELADDEKAVLFKLETAPGVFEYYLGLNNFYTVWQYNHSRMYVTAVRDIANSLGGSGL',
'MASSSSSKQAKPIHRMAWRLGVSLTLLLGLGALFVLPKFDPKSLTWPTTEPGRIAPLAMSGGNPYLRALMRTISASESNDASPYTVLYGGSHIENLQEHPDRCIPIRWGPNQGLCTTAAGRYQFITTTWLETAEKYHPAPTGEWMWRRYSFAPEYQDRVVYAWLDDVNYWGTDIPQLLEDGQLQTVLKRLSGTWTSLGYGIESNKVTPHLMHIYERMLAEEIALANGLPTNYLPTVANQSVETTR',
'MIIQHSQPKRKGTKYRLKKPYKLVFNLIIVVGLIGLVYSFKKNTQPLVNPSLVTHLPELEMSGGDPYIRALMLTISASESNHKNSYYLLYGGSHVHNLQQHPDQCIPINIGPNRGNCSTAAGRYQFLNSTWQEKARKYHPNPQKNYRQYIYSFEPKYQDIVVYRWLKDHHQWNVDLLTLLKQDQVEEVLRKLSNVWTSLGGGIEDNSMTPHLPSIYRYFLAQELNRENADQNSL',
'MVEINNQRKAFLDMLAWSEGTDNGRQKTRNHGYDVIVGGELFTDYSDHPRKLVTLNPKLKSTAAGRYQLLSRWWDAYRKQLGLKDFSPKSQDAVALQQIKERGALPMIDRGDIRQAIDRCSNIWASLPGAGYGQFEHKADSLIVKFKEAGGTVREIEV',
'MGYTWKGLAKQYGFTDFSPATQDKAAVALILAKKGAMEAILNGDYEQAVMKLGGIWASFPTAPNEYRQHKRSWGFVHNFFRQRGF',
'MARISAADAGGVNVIAFLDMLAWSEGTSTIKASDYGYDVLVGGKLFSEYSKHPRVKVWLPKYSIYSSAAGRYQFLAGTWDAIVKNYGFKGRFIPEAQDLAAIKLLTECGALPLIKAGRIVEAIAKAAPIWASLPGAGYGQREHKLAALLGIYEAERAAEAKPQDQLLAMFSACGGEMAA',
'MTRYEFALLALAAVGYVVWRDWQRSEEPGAQSPDFIDQAENLFYDATEGNFFGGTEDTDMGQAQLNRAAFLLTIRTGEGTAGNDGYRMLFGGGKFDSFADHPRQVVTALSNGKPISSSAAGAYQFLRRTWDTLAARLGLTDFSPASQDAAALELIREAGALGDVDAGRFALAVRKVRKIWASMPGAGYGQPEVALERLQAAYQAAGGVVNG',
'MPVINTHQNIAAFLDMLAYSEGTANHPLTKNRGYDVIVTSLDGRPEIFTDYSDHPFAHGRPAKVFNRRGEKSTASGRYQQLYMFWPHYKKQLALPDFSPLSQDKLAIQLIRERGAIDDIRAGRIERAVSRCRNIWASLPGAGYGQREHSLEKLVTVWRTAGGVVA',
'MYSQQVQQINQPQKNSDIQLINMWLQQIHPIQQNSHLYIAQMFLKFIKKPLKKVTSADVIAFANVYGVRSHNSHSNQQKRIETINSLLKFGQEAGILPRNQKKTFSPNTTNFKTSVYSQNKIKNYRTTGKQQKKPLNWSQLFNLQLASSVLIVFILLMAILQLFRQVSGSTNANQNKSVTSVVMPKIDPTKNWAYPVNVPRIRAFLDTIAVTEGTTGPKGYYRQYTGSHFLSFEDHPRELKCANSNGKKLCSDAAGRYQFLSTSWDRFAPVVKAQNFSPTYQDRVAIELIRDKNALKDIEEGRVKEAFQKLYMVWPSFGETETDVEQLMPKLVGTYEQKLALYQIKN',
'MDDEFERAFKKILDYEGGYSDEQKDHGGKTKYGITEKLARDYGHEGEMKDLELEKAKEIYYREFWANHLYSWIEDERIATEVFEQAVNMGAKTANKHLQKAYNLLADKEIAVDGIIGQRTLEAVNNFEHNSDLFKLLNILQAKKYINIVKNDASQQKFIRGWLRRVELDIDSRKS',
'MKRNFQTVMPYIFSEEGGYADNPADPGGATNMGITINTLSAWEGRQVSPQDVKELTQATATQIYQVEFWNKIDGNDLPSGVDYALFDFAVNSGPGRAAKTLQKILAMPEDGIIGAQTVAAAAARSPEGIINALCDARAAWLRGLSTAATFGNGWLARVERVRARALALAATPPAITQPADPAGNPSPKARQADIAFTSALKHPEALGTMGSVASGLAAIATGNGPVQYALAIVMVACAGVGLWYFVRRVRSEP',
'MNFDQAFDRLLGHEGGYSNNSADPGGETMWGVTARVARADGYLGEMRDLPRDRAKSIYRRLYWTPVRADELPEVVRFDVFDGAVNSGPAQSIKWLQRAAGAVDDGILGPRTMAAAVAAGPVLAARYNGHRLLFLADRPTWGSFGKGWARRVGKNLLGA',
'MDQPPWLQAAWAEFGVREIPGKEDAPEILRYFRDAGDTNVETEATPWCAAFLGAMLKRAGYAGTGSLLARSYLDWGDRLDDARFGAVAVLSRGDDPNAGHVGFLLSDTNGKLYLLGGNQGDAVTVASFDKARLLGLRWPKENVEAASKGDDAIFSRVLAHVLEMEGGFSNDPYDPGGPTNRGITLEVYAKFRKETLDDGTRARLIAELKRIPDAIVTAIYRQRYFDPASCPVFTAPLALMHFDAAVNHGVGAAIRMLQGVAGVTVDGEIGPETLAAIGAKSLADLLDDYAETRRARYRALPHFWRFGRGWLKRVDATLALARTWAAAEATNRGLIEPQQIAKGEGKMGEKSKTEISSSDDSKWWLNSKTMWGTLITAAATVIPVLGPAVGIVLPADLITSFGDQVVTAAQALAGLFGTALAIYGRLKADTPLVLRKN',
'MSAPLTFQQVFDRVVGHEGGYVNDPHDPGGETNWGITKYTARENGYTGSMKAMTREQAYKIYEKAFWQRYHCEKLPEAVAFQFFDAAVNHGVGNASRMLQRAVNVADDGIIGKVTLSAVEKMPISDLLLRFNAERIRFYTKLKNFPRYGKGWMNRIAGNLAYAAIDNEV',
'MNPIIDGIIALEGGYVFNPKDKGGATHWGITEATARAHGYAGDMRDLTHAEAYAILEEDYWIKPGFDVISTLSWPVSFELCDAAVNIGAYHPSAWLQRWLNVFNHEGKRYPDIHVDGNIGPRTLAALEHYLAWRGQEGEAVLVKALNCSQGTYYLNVAEKNHNNEQFIYGWIKNRVT',
'MDSFEDAFKALIGNEGGYSFNPADPGGETMWGVTARVARSEGYNGAMKDLPLETAHQIAKRRYWDPLHLDELDPRVAFQIFDANYNGGLVVLWMQKASGAKEDGKFGPDTLDAVKNADPMKFVMRFAAYRLRYLRNLHSWPSFSRGWTERMAANLLLGAA',
'MSQTATLSDFNKAFDRVIQHEGGYVNDPRDAGGETKFGITIHTARANGYTGSMFTMTRDDAKQIYLKAFWQRYRCNEFPPELAFQFFDACVNHGSGNASRMLQRAVGVVDDGIIGEITLAAIRKRSTVEVVTLFNAERLEFYTKLSGFQHFGKGWIRRMAGNLRHIADDVGDK'],
'letters': 'MRKFNKPLLALLIGSTLCSAAQAAAPGKPTIAWGNTKFAIVEVDQAATAYNNLVKVKNAADVSVSWNLWNGDAGTTAKILLNGKEAWSGPSTGSSGTANFKVNKGGRYQMQVALCNADGCTASDATEIVVADTDGSHLAPLKEPLLEKNKPYKQNSGKVVGSYFVEWGVYGRNFTVDKIPAQNLTHLLYGFIPICGGNGINDSLKEIEGSFQALQRSCQGREDFKVSIHDPFAALQKAQKGVTAWDDPYKGNFGQLMALKQAHPDLKILPSIGGWTLSDPFFFMGDKVKRDRFVGSVKEFLQTWKFFDGVDIDWEFPGGKGANPNLGSPQDGETYVLLMKELRAMLDQLSAETGRKYELTSAISAGKDKIDKVAYNVAQNSMDHIFLMSYDFYGPFDLKNLGHQTALNAPAWKPDTAYTTVNGVNALLAQGVKPGKVVVGTAMYGRGWTGVNGYQNNIPFTGTATGPVKGTWKNGIVDYRQIAGQFMSGEWQYTYDATAEAPYVFKPSTGDLITFDDARSVQAKGKYVLDKQLGGLFSWEIDADNGDILNSMNASLGNSAGVQMSTRKAVIGYYFIPTNQINNYTETDTSVVPFPVSNITPAKAKQLTHINFSFLDINSNLECAWDPATNDAKARDVVNRLTALKAHNPSLRIMFSIGGWYYSNDLGVSHANYVNAVKTPAARTKFAQSCVRIMKDYGFDGVDIDWEYPQAAEVDGFIAALQEIRTLLNQQTIADGRQALPYQLTIAGAGGAFFLSRYYSKLAQIVAPLDYINLMTYDLAGPWEKITNHQAALFGDAAGPTFYNALREANLGWSWEELTRAFPSPFSLTVDAAVQQHLMMEGVPSAKIVMGVPFYGRAFKGVSGGNGGQYSSHSTPGEDPYPNADYWLVGCDECVRDKDPRIASYRQLEQMLQGNYGYQRLWNDKTKTPYLYHAQNGLFVTYDDAESFKYKAKYIKQQQLGGVMFWHLGQDNRNGDLLAALDRYFNAADYDDSQLDMGTGLRYTGVGPGNLPIMTAPAYVPGTTYAQGALVSYQGYVWQTKWGYITSAPGSDSAWLKVGRLAMLSFVKKSIALVAALQAVTALATPISSEAGVEKRGSGFANAVYFTNWGIYGRNFQPADLPASEITHVLYSFMNVRADGTIFSGDTYADYEKHYAGDSWNDVGTNAYGCVKQLYLLKKQNRNMKVMLSIGGWTWSTNFPAAASSAATRKTFAQSAVGFMKDWGFDGIDIDWEYPADATQAQNMVLLLQAVRSELDSYAAQYAKGHHFLLSIAAPAGPDNYNKLKFAELGKVLDYINLMAYDYAGSWSNYTGHDANIYANPQNPNATPYNTDDAVQAYINGGVPANKIVLGMPIYGRSFQQTEGIGKPYNGIGSGSWENGIWDYKALPKAGATVKCDDTAKGCYSYDPSTKELISFDTPAMISTKVSWLKGKGLGGTMFWEASASKKGSDSLISTSHQGLGSQDSTQNYLDYPNSKYDNIKKGMNMILNLIILLAISIVASASNIAAYWGQNAGGDQQTLGDYCSSSPASIIILSFLDGFPNLSLNFANQCSGTFSSGLAHCSQIGSDIKSCQQQGKTILLSLGGATGNYGFSSDSEAVQFAGTLWNKFGGGKDSERPFDDAIVDGFDFDIENKDQTGYAALATQLRKYFSTGTKSYYLSAAPQCPYPDESVGDLMSQVDLDFAFIQFYNNYCSLNQQFNWNSWSNYARGKSIKLYLGLPGSSSSAGSGFVGLSTVQRVVASIKGDSSFGGISIWDISSAENGGYLNQLYQALSGSGSPAAPSNSYQPNTPLTRTYGGSTATASAYISVGFTAGATHGSTTTNDLLAWIDSLFGSSQSSVQQYATPVQSVTATPQPVAATTTSAPKPTASAFNWFGWFDGTTTSTTLQTVYSTVPADQTVYVTLTTTVGSQMLQSLFDKRDVIAEAKSTNLQICWLLFIPLLALICSMAKRTQAILLLLLAISLIMSSSHVDGGGIAIYWGQNGNEGT
LTQTCSTRKYSYVNIAFLNKFGNGQTPQINLAGHCNPAAGGCTIVSNGIRSCQIQGIKVMLSLGGGIGSYTLASQADAKNVADYLWNNFLGGKSSSRPLGDAVLDGIDFDIEHGSTLYWDDLARYLSAYSKQGKKVYLTAAPQCPFPDRYLGTALNTGLFDYVWVQFYNNPPCQYSSGNINNIINSWNRWTTSINAGKIFLGLPAAPEAAGSGYVPPDVLISRILPEIKKSPKYGGVMLWSKFYDDKNGYSSSILDSVLFLHSEECMTVLMTKLILLTGLVLILNLQLGSAYQLTCYFTNWAQYRPGLGRFMPDNIDPCLCTHLIYAFAGRQNNEITTIEWNDVTLYQAFNGLKNKNSQLKTLLAIGGWNFGTAPFTAMVSTPENRQTFITSVIKFLRQYEFDGLDFDWEYPGSRGSPPQDKHLFTVLVQEMREAFEQEAKQINKPRLMVTAAVAAGISNIQSGYEIPQLSQYLDYIHVMTYDLHGSWEGYTGENSPLYKYPTDTGSNAYLNVDYVMNYWKDNGAPAEKLIVGFPTYGHNFILSNPSNTGIGAPTSGAGPAGPYAKESGIWAYYEICTFLKNGATQGWDAPQEVPYAYQGNVWVGYDNIKSFDIKAQWLKHNKFGGAMVWAIDLDDFTGTFCNQGKFPLISTLKKALGLQSASCTAPAQPIEPITAAPSGSGNGSGSSSSGGSSGGSGFCAVRANGLYPVANNRNAFWHCVNGVTYQQNCQAGLVFDTSCDCCNWAMKKFINQFSASLKNNILVFLAFPFVWTSCARDNPLSSENSNISPNAAARAAVTGTTKANIKLFSFTEVNDTNPLNNLNFTLKNSGKPLVDMVVLFSANINYDAANDKVFVSNNPNVQHLLTNRAKYLKPLQDKGIKVILSILGNHDRSGIANLSTARAKAFAQELKNTCDLYNLDGVFFDDEYSAYQTPPPSGFVTPSNNAAARLAYETKQAMPNKLVTVYVYSRTSSFPTAVDGVNAGSYVDYAIHDYGGSYDLATNYPGLAKSGMVMSSQEFNQGRYATAQALRNIVTKGYGGHMIFAMDPNRSNFTSGQLPALKLIAKELYGDELVYSNTPYSKDWMKLNIFTKSMIGMGLVCSALPALAMEAWNNQQGGNKYQVIFDGKIYENAWWVSSTNCPGKAKANDATNPWRLKRTATAAEISQFGNTLSCEKSGSSSSSNSNTPASNTPANGGSATPAQGTVPSNSSVVAWNKQQGGQTWYVVFNGAVYKNAWWVASSNCPGDAKSNDASNPWRYVRAATATEISETSNPQSCTSAPQPSPDVKPAPDVKPAPDVQPAPADKSNDNYAVVAWKGQEGSSTWYVIYNGGIYKNAWWVGAANCPGDAKENDASNPWRYVRAATATEISQYGNPGSCSVKPDNNGGAVTPVDPTPETPVTPTPDNSEPSTPADSVNDYSLQAWSGQEGSEIYHVIFNGNVYKNAWWVGSKDCPRGTSAENSNNPWRLERTATAAELSQYGNPTTCEIDNGGVIVADGFQASKAYSADSIVDYNDAHYKTSVDQDAWGFVPGGDNPWKKYEPAKAWSASTVYVKGDRVVVDGQAYEALFWTQSDNPALVANQNATGSNSRPWKPLGKAQSYSNEELNNAPQFNPETLYASDTLIRFNGVNYISQSKVQKVSPSDSNPWRVFVDWTGTKERVGTPKKAWPKHVYAPYVDFTLNTIPDLAALAKNHNVNHFTLAFVVSKDANTCLPTWGTAYGMQNYAQYSKIKALREAGGDVMLSIGGANNAPLAASCKNVDDLMQHYYDIVDNLNLKVLDFDIEGTWVADQASIERRNLAVKKVQDKWKSEGKDIAIWYTLPILPTGLTPEGMNVLSDAKAKGVELAGVNVMTMDYGNAICQSANTEGQNIHGKCATSAIANLHSQLKGLHPNKSDAEIDAMMGTTPMVGVNDVQGEVFYLSDARLVMQDAQKRNLGMVGIWSIARDLPGGTNLSPEFHGLTKEQAPKYAFSEIFAPFTKQMSTPRAAASLAKKAALVA
LAVLAAALATAARAEQCGAQAGGARCPNCLCCSRWGWCGTTSDFCGDGCQSQCSGCGPTPTPTPPSPSDGVGSIVPRDLFERLLLHRNDGACPARGFYTYEAFLAAAAAFPAFGGTGNTETRKREVAAFLGQTSHETTGGWPTAPDGPFSWGYCFKQEQNPPSDYCQPSPEWPCAPGRKYYGRGPIQLSFNFNYGPAGRAIGVDLLSNPDLVATDATVSFKTALWFWMTPQGNKPSSHDVITGRWAPSPADAAAGRAPGYGVITNIVNGGLECGHGPDDRVANRIGFYQRYCGAFGIGTGGNLDCYNQRPFNSGSSVGLAEQMPPQKENHRTLNKMKTNLFLFLIFSLLLSLSSAEQCGRQAGGALCPNGLCCSEFGWCGNTEPYCKQPGCQSQCTPGGTPPGPTGDLSGIISSSQFDDMLKHRNDAACPARGFYTYNAFITAAKSFPGFGTTGDTATRKKEVAAFFGQTSHETTGGWATAPDGPYSWGYCFKQEQNPASDYCEPSATWPCASGKRYYGRGPMQLSWNYNYGLCGRAIGVDLLNNPDLVANDAVIAFKAAIWFWMTAQPPKPSCHAVIAGQWQPSDADRAAGRLPGYGVITNIINGGLECGRGQDGRVADRIGFYQRYCNIFGVNPGGNLDCYNQRSFVNGLLEAAIMRLCKFTALSSLLFSLLLLSASAEQCGSQAGGARCPSGLCCSKFGWCGNTNDYCGPGNCQSQCPGGPTPTPPTPPGGGDLGSIISSSMFDQMLKHRNDNACQGKGFYSYNAFINAARSFPGFGTSGDTTARKREIAAFFAQTSHETTGGWATAPDGPYAWGYCWLREQGSPGDYCTPSGQWPCAPGRKYFGRGPIQISHNYNYGPCGRAIGVDLLNNPDLVATDPVISFKSALWFWMTPQSPKPSCHDVIIGRWQPSAGDRAANRLPGFGVITNIINGGLECGRGTDSRVQDRIGFYRRYCSILGVSPGDNLDCGNQRSFGNGLLVDTMMRSLAVVVAVVATVAMAIGTARGSVSSIVSRAQFDRMLLHRNDGACQAKGFYTYDAFVAAAAAFPGFGTTGSADAQKREVAAFLAQTSHETTGGWATAPDGAFAWGYCFKQERGASSDYCTPSAQWPCAPGKRYYGRGPIQLSHNYNYGPAGRAIGVDLLANPDLVATDATVGFKTAIWFWMTAQPPKPSSHAVIAGQWSPSGADRAAGRVPGFGVITNIINGGIECGHGQDSRVADRIGFYKRYCDILGVGYGNNLDCYSQRPFAMGAFALFAVLAMAVTMAVAEQCGSQAGGATCPNCLCCSRFGWCGSTSDYCGDGCQSQCAGCGGGGTPVTPTPTPSGGGGVSSIVSRALFDRMLLHRNDGACQAKGFYTYDAFVAAAGAFPGFGTTGSTDTRKREVAAFLAQTSHETTGGWATAPDGAFAWGYCFKQERGATSNYCTPSAQWPCAPGKSYYGRGPIQLSHNYNYGPAGRAIGVDLLRNPDLVATDPTVSFKTAMWFWMTAQAPKPSSHAVITGQWSPSGTDRAAGRVPGFGVITNIVNGGIECGHGQDSRVADRIGFYKRYCDILRVGYGNNLDCYNQRPFAMRLSEFTTLFLLFSVLLLSASAEQCGSQAGGALCASGLCCSKFGWCGNTNEYCGPGNCQSQCPGGPGPSGDLGGVISNSMFDQMLNHRNDNACQGKNNFYSYNAFVTAAGSFPGFGTTGDITARKREIAAFLAQTSHETTGGWPTAPDGPYAWGYCFLREQGSPGDYCTPSSQWPCAPGRKYFGRGPIQISHNYNYGPCGRAIGVDLLNNPDLVATDPVISFKSAIWFWMTPQSPKPSCHDVITGRWQPSGADQAANRVPGFGVITNIINGGLECGHGSDSRVQDRIGFYRRYCGILGVSPGENLDCGNQRSFGNGLLVDIMQNCQCDTTIYCCSQHGYCGNSYDYCGPGCQAGPCWDPCEGDGTLTVSDIVTQEFWDGIASQAAANCPGKSFYTRSNFLEAVSAYPGFGTKCTDEDRKREIAAYFA
HVTHETGHLCYIEERDGHANNYCQESQQYPCNPNKEYFGRGPMQLSWNYNYIDAGKELHFDGLNDPDIVGRDPIISFKTSLWFWIRKGVQYVILDPNQGFGATIRIINGGQECDGHNTAQMMARVGYYQEYCAQLGVSPGNNLPCMKKNRMMMMIWSVGVVWMLLLVGGSYGEQCGRQAGGALCPGGNCCSQFGWCGSTTDYCGPGCQSQCGGPSPAPTDLSALISRSTFDQMLKHRNDGACPAKGFYTYDAFIAAAKAYPSFGNTGDTATRKREIAAFLGQTSHETTGGWATAPDGPYAWGYCFVRERNPSTYCSATPQFPCAPGQQYYGRGPIQISWNYNYGQCGRAIGVDLLNKPDLVATDSVISFKSALWFWMTAQSPKPSSHDVITSRWTPSSADVAARRLPGYGTVTNIINGGLECGRGQDSRVQDRIGFFKRYCDLLGVGYGNNLDCYSQTPFGNSLLLSDLVTSQMRSLLILVLCFLPLAALGKVFGRCELAAAMKRHGLDNYRGYSLGNWVCAAKFESNFNTQATNRNTDGSTDYGILQINSRWWCNDGRTPGSRNLCNIPCSALLSSDITASVNCAKKIVSDGNGMNAWVAWRNRCKGTDVQAWIRGCRLMKALIVLGLVLLSVTVQGKVFERCELARTLKRLGMDGYRGISLANWMCLAKWESGYNTRATNYNAGDRSTDYGIFQINSRYWCNDGKTPGAVNACHLSCSALLQDNIADAVACAKRVVRDPQGIRAWVAWRNRCQNRDVRQYVQGCGVMKAFIVLVALACAAPAFGRTMDRCSLAREMSNLGVPRDQLNKWACIAEHESSYRTGVVGPENYNGSNDYGIFQINDYYWCAPPSGRFSYNECGLSCNALLTDDITHSVRCAQKVLSQQGWSAWSTWHYCSGWLPSIDDCFKIFSKCELARKLKSMGMDGFHGYSLANWVCMAEYESNFNTQAFNGRNSNGSSDYGIFQLNSKWWCKSNSHSSANACNIMCSKFLDDNIDDDIACAKRVVKDPNGMSAWVAWVKHCKGKDLSKYLASCNLMTKYVILLAVLAFALHCDAKRFTRCGLVQELRRLGFDETLMSNWVCLVENESGRFTDKIGKVNKNGSRDYGLFQINDKYWCSKGTTPGKDCNVTCNQLLTDDISVAATCAKKIYKRHKFDAWYGWKNHCQHGLPDISDCKVYDRCEFARILKKSGMDGYRGVSLANWVCLAKWESDFNTKAINRNVGSTDYGIFQINSRYWCNDGKTPKAVNACHISCKVLLDDDLSQDIECAKRVVRDPQGIKAWVAWRTHCQNKDVSQYIRGCKLMKAVIILGLVLLSVTVQGKIFERCELARTLKRLGLDGYRGISLANWVCLAKWESDYNTQATNYNPGDQSTDYGIFQINSHYWCNNGKTPGAVNACRISCNALLQDNIADAVTCAKRVVRDPQGIRAWVAWRNHCQNRDVSQYVQGCGVKIYEQCEAAREMKRLGLDGYDGYSLGDWVCTAKHESNFNTGATNYNRGDQSTDYGIFQINSRWWCNDGKTPNAKNACGIECSELLKADITAAVICAKRVVRDPNGMGAWVAWTKYCKGKDVSQWIKGCKLMSALWLLLGLLALMDLSESSNWGCYGNIQSLDTPGASCGIGRRHGLNYCGVRASERLAEIDMPYLLKYQPMMQTIGQKYCMDPAVIAGVLSRKSPGDKILVNMGDRTSMVQDPGSQAPTSWISESQVSQTTEVLTTRIKEIQRRFPTWTPDQYLRGGLCAYSGGAGYVRSSQDLSCDFCNDVLARAKYLKRHGFRTDCYGNVNRIDTTGASCKTAKPEGLSYCGVSASKKIAERDLQAMDRYKTIIKKVGEKLCVEPAVIAGIISRESHAGKVLKNGWGDRGNGFGLMQVDKRSHKPQGTWNGEVHITQGTTILINFIKTIQKKFPSWTKDQQLKGGISAYNAGAGNVRSYARMDIGTTHDDYANDVVARAQYYKQHGYMVPSVVFWGLIALVGTAKGSYTHSVHSMNPHVHPRLYHG
CYGDIMTMETFGAPCDINNLMNCGIHGSEMFAEMDLKAIKPYRILIKEVGQRHCIDPALIAAIISRESHGGAVLQNGWDHKGQRFGLMQLDKNMYHPIGSWDSKEHLLQSVGILTERIKAMKRKFPTWNTAQQLKGGLTAFKSGMETIVTPADIDGDLVDDVLARAKFYKRHGFMGYGNIMNVETTGASWQTAQQDKLGYSGVRASHTMANTDSGRMERYRSKINSVGAKYGIDPALIAAIISEESRAGNVLHDGWGDYDSNRGAYNAWGLMQVDVNPNGGGHTARGAWDSEEHLSQGAEILVYFIGRIRNKFPGWNTEQQLKGGIAAYNMGDGNVHSYDNVDGRTTGGDYSNDVVARAQWYKTQKGFMPYGKIEDIKTSGASDVTAAQDGLKEGGWKSSHRMAEIDSNRMENYRTIINEAGRQCDVDPAVIAGIISRESRAGNQLINGWGDHGKAFGLMQIDVTPPPNGGGHTPVGTWDSLEHLIQATEILVEFIERIKTKFPRWNADQHLKGALAAYNKGEKNVESYASVDAKTTGKDYSNDVVARAQWYKSNMGFMKCLVALFLSLSLVACQYDDYDTERKNNNMLSSMNILDLLDSFGLNIKARIAHVRRVAGRIRLTLDIGLGNGDVERESEEAEGEGTDGRGGGEGEREGWGGEREGGEGEREGGEGEREGREGEREGKSSESNESPEDFIGPPVDMCAGESRRGSPSIGCIAAECCQHSFYINSLCPGSSVCCFSMDVCDRLPVPVIPPFPTDPGTLPPPPPIPDSQTTVSPNQPSSYMCHGDFMKLMPKGADQRTARQDNLAYAGVRASNKLVDNDLAELNKRKDCYVQAGKNHCIHPAVIAAIASRETRGGKLLYSTNGYGDGGRAYGIMQCDGGASGLGDICKKYPWDSCEHINQLTDIILLNYVNQMKTKHPSWPAHYQLKGGVSAYNAGVGNVQTIAGMDAGTTNDDYSNDVIARAQRLVNAHGWMLGKNDPMCLVLVLLGLTALLGICQGGTGCYGSVSRIDTTGASCRTAKPEGLSYCGVRASRTIAERDLGSMNKYKVLIKRVGEALCIEPAVIAGIISRESHAGKILKNGWGDRGNGFGLMQVDKRYHKIEGTWNGEAHIRQGTRILIDMVKKIQRKFPRWTRDQQLKGGISAYNAGVGNVRSYERMDIGTLHDDYSNDVVARAQYFKQHGYMHLMLVLLGLAALLGTSQSRTGCYGDVNRVDTTGASCKSAKPEKLNYCGVAASRKIAERDLQSMDRYKALIKKVGQKLCVDPAVIAGIISRESHAGKALRNGWGDNGNGFGLMQVDRRSHKPVGEWNGERHLMQGTEILISMIKAIQKKFPRWTKEQQLKGGISAYNAGPGNVRSYERMDIGTTHDDYANDVVARAQYYKQHGYMNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKSELDKAIGRNCNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRCALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNLMEMISNNLNWFVGVVEDRMDPLKLGRVRVRVVGLHPPQRAQGDVMGIPTEKLPWMSVIQPITSAAMSGIGGSVTGPVEGTRVYGHFLDKWKTNGIVLGTYGGIVREKPNRLEGFSDPTGQYPRRLGNDTNVLNQGGEVGYDSSSNVIQDSNLDTAINPDDRPLSEIPTDDNPNMSMAEMLRRDEGLRLKVYWDTEGYPTIGIGHLIMKQPVRDMAQINKVLSKQVGREITGNPGSITMEEATTLFERDLADMQRDIKSHSKVGPVWQAVNRSRQMALENMAFQMGVGGVAKFNTMLTAMLAGDWEKAYKAGRDSLWYQQTKGRASRVTMIILTGNLESYGVEVKTPARSLSAMAATVAKSSDPADPPIPNDSRILFKEPVSSYKGEYPYVHTMETESGHIQEFDDTPGQERYRLVHPTGTYEEVSPSGRRTRKTVDNLYDITNA
DGNFLVAGDKKTNVGGSEIYYNMDNRLHQIDGSNTIFVRGDETKTVEGNGTILVKGNVTIIVEGNADITVKGDATTLVEGNQTNTVNGNLSWKVAGTVDWDVGGDWTEKMASMSSISSGQYTIDGSRIDIGMPPSLRKAVAAAIGGGAIAIASVLITGPSGNDGLEGVSYIPYKDIVGVWTVCHGHTGKDIMLGKTYTKAECKALLNKDLATVARQINPYIKVDIPETTRGALYSFVYNVGAGNFRTSTLLRKINQGDIKGACDQLRRWTYAGGKQWKGLMTRREIEREVCLWGQQMVEINNQRKAFLDMLAWSEGTDNGRQKTRNHGYDVIVGGELFTDYSDHPRKLVTLNPKLKSTGAGRYQLLSRWWDAYRKQLGLKDFSPKSQDAVALQQIKERGALPMIDRGDIRQAIDRCSNIWASLPGAGYGQFEHKADSLIAKFKEAGGTVREIDVMKGKTAAGGGAICAIAVMITIVMGNGNVRTNQAGLELIGNAEGCRRDPYMCPAGVWTDGIGNTHGVTPGVRKTDQQIAADWEKNILIAERCINQHFRGKDMPDNAFSAMTSAAFNMGCNSLRTYYSKARGMRVETSIHKWAQKGEWVNMCNHLPDFVNSNGVPLRGLKIRREKERQLCLTGLVNEMMQISSNGITRLKREEGERLKAYSDSRGIPTIGVGHTGKVDGNSVASGMTITAEKSSELLKEDLQWVEDAISSLVRVPLNQNQYDALCSLIFNIGKSAFAGSTVLRQLNLKNYQAAADAFLLWKKAGKDPDILLPRRRRERALFLSMQISQAGINLIKSFEGLQLKAYKAVPTEKHYTIGYGHYGSDVSPRQVITAKQAEDMLRDDVQAFVDGVNKALKVSVTQNQFDALVSFAYNVGLGAFRSSSLLEYLNEGRTALAAAEFPKWNKSGGKVYQGLINRRAQEQALFNSGTPKNVSRGTSSTKTTPKYKVKSGDNLTKIAKKHNTTVATLLKLNPSIKDPNMIRVGQTINVTGSGGKTHKVKSGDTLSKIAVDNKTTVSRLMSLNPEITNPNHIKVGQTIRLSMKVSQNGLNLIKEFEGCRLTAYKPVPWEQMYTIGWGHYGVTAGTTWTQAQADSQLEIDINNKYAPMVDAYVKGKANQNEFDALVSLAYNCGNVFVADGWAPFSHAYCASMIPKYRNAGGQVLQGLVRRRQAELNLFNKPVSSNSNQNNQTGGMIKMYLIIGLDNSGKAKHWYVSDGVSVRHVRTIRMLENYQNKWAKLNLPVDTMFIAEIEAEFGRKIDMASGEVKMVKKNDLFVDVSSHNGYDITGILEQMGTTNTIIKISESTTYLNPCLSAQVEQSNPIGFYHFARFGGDVAEAEREAQFFLDNVPMQVKYLVLDYEDDPSGDAQANTNACLRFMQMIADAGYKPIYYSYKPFTHDNVDYQQILAQFPNSLWIAGYGLNDGTANFEYFPSMDGIRWWQYSSNPFDKNIVLLDDEEDDKPKTAGTWKQDSKGWWFRRNNGSFPYNKWEKIGGVWYYFDSKGYCLTSEWLKDNEKWYYLKDNGAMATGWVLVGSEWYYMDDSGAMVTGWVKYKNNWYYMTNERGNMVSNEFIKSGKGWYFMNTNGELADNPSFTKEPDGLITVATVQGFDISSYQPSVNFAGAYSAGARFVIIKATEGTSYTNPSFSSQYNGATTATGNYFIRGGYHFAHPGETTGAAQADYFIAHGGGWSGDGITLPGMLDLESEGSNPACWGLSAASMVAWIKAFSDRYHAVTGRYPMLYTNPSWWSSCTGNSNAFVNTNPLVLANRYASAPGTIPGGWPYQTIWQNSDAYAYGGSNNFINGSIDNLKKLATGMKGIDIYSGQGSVDFNAVKESGVEVVYIKATEGLTYTDSTYKDFYDGAKNAGLKIGFYHYLRANDPTSEAEHFFNTISGLSLDCKCAIDVEVTLGQSIDQISSNVRKFADYLINKGLDVCVYTYTNFYKDNLNSTVKDLPLWIAEYGVSKPNIDASYVGFQYSDSGSVNGISGSADLDEFS
EGILVGGTVVIDPGQGGDDNIKAIQQDLNILLKRGLEVDGIEGPETEAAIKDFQSIMGLTVDGIWGTNTSGAAQQIFSRPLDGVAYPHYEYATRYIQYRVGASVDGTFGSGTKAKVAAWQSNQGLMADGVVGSATWSKLLDENKLGIDVSQPTSTSSFTCLRNKGFTTMVIVRAWKSTGSFDTNAPQTLKNANAAGFSIENSDVYYYPCISCGNMAGQVRTFWQKVGQYSLKVKRVWFDIEGTWTSSVSTNQNYLMQMMNEARAIGIVHGIYGSKYYWGNLFGSSYKYRYRSSTPLWYPHYDNSPSFSDFSSFGGWTSPSMKQYRGDVSVCSAGVDYNYKPMPAYSSLARRGRRPAVVLLGGLVSASLALTLAPTAAAAPLAPPPGKDVGPGEAYMGVGTRIEQGLGAGPDERTIGPADTSGVQGIDVSHWQGSINWSSVKSAGMSFAYIKATEGTNYKDDRFSANYTNAYNAGIIRGAYHFARPNASSGTAQADYFASNGGGWSRDNRTLPGVLDIEHNPSGAMCYGLSTTQMRTWINDFHARYKARTTRDVVIYTTASWWNTCTGSWNGMAAKSPFWVAHWGVSAPTVPSGFPTWTFWQYSATGRVGGVSGDVDRNKFNGSAARLLALANNTAMTKTYGVDVAVYQPIDLAAYHKAGASFAIVKLTEGVDYVNRRGPSRWTAPGLTTSTLMPTISRSFGSSVSRAKKEAAYFLKEAKKQDISKKRMLWLDWEAGSGNVVTGSKSSNTAAILDFMDAIKAAGWRPGLYSGASLMRTAIDTKQVVKKYGTCLWVASYPTMAAVSTADFGYFRQWTGSPSGSLPVTAWPGRRRERCSGMQLRITSRKKLTSLLCALGLISIVAIYPRQTVNFFYSTAVQITDYIHFYGYRPVKSFAIRIPASYTIHGIDVSRWQERIDWQRVAKMRDNGIRLQFAFIKATEGEKLVDPYFSRNWQLSRENGLLRGAYHYFSPSVSASVQARLFLQTVDFSQGDFPAVLDVEERGKLSAKELRKRVSQWLKMVEKSTGKKPIIYSGAVFYHTNLAGYFNEYPWWVAHYYQRRPDNDGMAWRFWQHSDRGQVDGINGPVDFNVFNGTVEELQAFVDGIKETPMRFIALLISFFALLKVISAISGVDISSASTIESFTCLKSAGYDFAIIRAYESLGQVDPNGPHSVYNARDAGIEYVDVYMFPCPTCGNGAGQAETMVNYLKGYNANYGMVWLDIEGPQYWMSQSENVAFFESLVAGLKAEGAHIGVYTSASQWEPIMGGYTGGSEFPLWYAHYDGNPSFSDFSPFNGWSTPSVKQYDDTGDSCGLGFDLNWYPMHCAPSWKSSDERRTMLDQINTLDPNSLTALKRMSKDNSPAAIKGAAQQFEALFLQNMLKSMRDATVTSDAMGSETTRFYQGLYDQQLAAMMAQRGGIGLADVMEKQMGAQAASAQNAAAAGASSAGNVPLSLDAARAAAAHTASGDKVPTTPQAFVDATWPQAAKAAQSLGVPAHFLVAQAALETGWGKSQIRNKDGTPSYNLFNIKAGSNWTGKVVEARTVEYENGQRKVRVERFRAYDSYEQAFQDYADLVGNSPRYAKVAGKTDGHAFARALQEGGYATDPSYADKLARVINGNALRQRLMASAASARGMINKKWMKIVMIPMLVVPMYGLTSVSGQIQDSLTGENSFVKDAEAATTASQQAFIDKIAPAAQASQEQYHLLSSITLAQAILESGWGKSGLATKGYNLFGIKGKYNGQSVIMSTSEYVNGQWIKIDAEFRKYPSWNESVTDHTLLLVNGTSWNKNLYKKVVDATDYKVAAMELQKAGYASPTYGASLIQVIENYDLAKYDVLYDKILTQKSTSGKATVTSPTGNGVWTLPYKVKGVQSVSPASTYANKDIDLVSVATTKRGTYYQFKYNGKVVGWVDAKALTIYDSVNYDKVNVGRAKITSPVSNGIWSKPYNVYGREFVTNATTYAQQEIKLLREAQTAKGTYYQFSINNKTIGWIDKRALTIYP
YDSIVSSKNVSLDGQITNPTGNGIWTKAYKLEGTTSVAQATKYANKDVKISQQVETQHGTYYNISIDGKAIGWLDKNAITLYDQAEYNKTVAFDAAIRNVQGNAVWTEPYRTVGTKLIGPAETYLNKEVEVVREAKTPKGTYYQFKSGGKVIGWLDKKAFEVYDNINYNKAVNLDAVVENVTGNAVWTAPYKSKGVKLVTSAATYKGKATKITREAQTSRGTYYEFSVNGKVIGWLDKKAFDVYDSIEYNKAINMTGLLSNAPGNGIWTEPYRVLDTKNIGQATAYANKTVQLVREAKTSHSTYYQMSLNGKVIGWIDKRAFTNVKMVNTQVKRVKKQKFIAGTALLLGMATFGMVGKADDLSSSNTNGGVDNSKVDNDNQESVKTSTEGVSSTTENANTVPESKVTSTVDSESAPSKTISAGTQSNISGTSDGSDSLPKTETSDSSSKPSTSNSSSKPSTSNSSSKPSTSNSSSNNNSATKPSTTTQAPPVAPSTTAPSATPSTTAPSNYYQNSSYNQTSTAAQIPNSSSDSAASVYSGPVLKKIEAAKPIEKIDSSSTEAFIKSIADRVRILAGKNNLYASIILAQAILESGSGQSNMTQQYFNIFNITGAYLGKSISFKTEEFSGNNPYYIEQSFRVYSNYDQALDDYINLMIKGTTWNSEIYAGAWKSHAKTYQEAAQALQGIFATDPEYAQKLIEIIEEYNLNFYDNVDSTTQVLDSNIPESPLVASKLDSSTYPDYNGVEYPGADSYAFGNCTQYVYNRIIQLGGQIGTHMGNGGEWGINAQAQGYFTTTVPTEGYAVSFPPGVAGSSPEYGHVAFVEKVYPDNSILVSEMNVKGNNIVSERHISAGVAALATYIQPKMNRNRLSCLIVGAVIGAGAIVCTTNTKVHAKPVNEVKNINTSKGNSFGEIISSEDIGLRKGADSSHEIITSIPSGARVNIIDKMSKDWYKVSYKDFTGYLQAKDIRVLGDELNQDNVGLISANQLNVRTSPNENGQVIGTLHKNDKVNVLDKSIDGWYKIDFNGRRAYVSSKYVNLISYKNNEVKTEVKKEPIEGTGKVNINTALNVRQASTTNSRIIGSLKGGEKVNIISESNGFYKIEFNNSYGYVYSKYISKDGDSEKVQVVKQEEVKKEKVDESKKEAKATPKAEPVVLAVRSLNKTGIVNVSSSLNVREGAGTSSKVIGSLSGNTKVTIVGEEGAFYKIEYKGSHGYVAKEYVKDVTESSNSNQGTQTPEKPSTPESTEKTGIVNVSSSLNVREGASTSSKVIGSLSGNTKVIIVGEEGAFYKIEYKGSHGYVAKEYIKDVTESNNSNQGTQTPEKPSTPESTEKTGIVNVSSSLNVREGASTSSKVIGSLSGNTKVTIVGEEGAFYKIEYKGSHGYVAKEYIKDIKDEVVTEPEKPSAPENTEKTGVVNVSSSLNVREGASTSSKVIGSLSGNTKVIIVGEEGAFYKIEYKGSHGYVAKEYIKDVTESNNSNQGTQTPEKPSTPESTEKTGIVNVSSSLNVREGASTSSKVIGSLSGNTKVTIVGEEGAFYKIEYKGSHGYVAKEYVKDVTESNNSNQGTQTPEKPSTPESAEKTGVVNVSSSLNVREGASTSSKVIGSLSGNTKITIVGEEGAFYKIEYKGSHGYVAKEYIKDIKDEVVTEPEKPSTHENSKKTGVVTASKGLNVRKEANTSSQIIGILNSGESVEIIGEENGFYKITYKGQEAYASKNYINIFDGNSNVNPGLDIGNASKTNYGVSLNEYIKLQQRNNPSNYSYSEFEKYINPAKATNKLQFLRIDKFRSVNVSGLSSRLSNKGVLTGQGQAFVNAAKAFNIDPIYLVAQCLHETGNGTSKLAKGVTITEIADESKPIYNGNGQLVGYHMIKLSKPVTVYNLFGIGAKDNSSVFPNRALILGTTYAYNRGWTSIENAIKGAAEFVSLNYVHSSRYSQNTLYKMRYNQNVSNIWHQYATTPWYASSIADIMRSYQDLYLENNFTFDVPVFAGMKKESMS
RIERRKAQQRKKTPVQWKKSTTLFSSALIVSSVGTPVALLPVTAEATEEQPTNAEVAQAPTTETGLVETPTTETTPGTTEQPTTDSSTTTESTTESSKETPTTPSTEQPTADSTTPVESGTTDSSVAEITPVAPSATESEAAPAVTPDDEVKVPEARVASAQTFSALSPTQSPSEFIAELARCAQPIAQANDLYASVMMAQAIVESGWGASTLSKAPNYNLFGIKGSYNGQSVYMDTWEYLNGKWLVKKEPFRKYPSYMESFQDNAHVLKTTSFQAGVYYYAGAWKSNTSSYRDATAWLTGRYATDPSYNAKLNNVITAYNLTQYDTPSSGGNTGGGTVNPGTGGSNNQSGTNTYYTVKSGDTLNKIAAQYGVSVANLRSWNGISGDLIFVGQKLIVKKGASGNTGGSGSGGSNNNQSGTNTYYTVKSGDTLNKIAAQYGVSVANLRSWNGISGDLIFVGQKLIVKKGASGNTGGSNNGGSNNNQSGTNTYYTIKSGDTLNKIAAQYGVSVANLRSWNGISGDLIFAGQKIIVKKGTSGNTGGSSNGGSNNNQSGTNTYYTIKSGDTLNKISAQFGVSVANLQAWNNISGSLIFAGQKIIVKKGANSGSTNTNKPTNNGGGATTSYTIKSGDTLNKISAQFGVSVANLRSWNGIKGDLIFAGQTIIVKKGASAGGNASSTNSASGKRHTVKSGDSLWGLSMQYGISIQKIKQLNGLSGDTIYIGQTLKVGMKKRLIAPMLLSAASLAFFAMSGSAQAAAYTDYSLYKVEPSNTFSTESQASQAVAKLEKDTGWDASYQASGTTTTYQISASGIHSESEAKAILSGLAKQTSITGTSSPVGSKQPYVTISSGAISGEKQANTILAKLKQETGVAGAVKAYGAAQPYMNVMTSDIADETKVKALIQSLAKQTGIKSSYQPITHTVSVTTIQSGTIVGDSRAAQIKNAFQKESGLQASLKETVKGQAYYTFTTAAISGEANAKTLLQQLKQSTGITGSYKSINQKTTVESYNVQSAYFKGLSTVKDAISQIKKNTGVSGSYQQVGKSTSYTVNMKGITKQQLQKIDTFFKKKKWHYTSSSVKKTTTSAAYQITTAKILGEQQANKAAAFFAQKKVKAAKTAAGSTAENQYQLISEETSDQAKVTKGLNILKKNQLSASAKSVKKQIADTFKITTESLLDQTKVNQALTFFKSNHISVASQKTGQTAASSYQITTEAIISQEEIDRVLTFFKQNHIAVTTSKTGQTAYTQYKIVTTQLSSKTALNNGLTYLKSKSVTPSYTTKSNTLYKISVNEQFTGNDTAAAASTKLKQLYGWTSSIVKIKNGPQIMKTNYNLSLRDMVQKQMTVSPQTDGAAYVSLTYINTATSTVTADVLNIRSTPEVSPTNVIGQFKKGDKVKVIGQINGWAKINLGWRNASSDEVVQYVDPNNFSRDSKYYFQFLKLSQTAGLSVTEVNQKVLAGKGILTGRAKAFIDAANQYSINELYLISHALLETGNGTSALANGLTYNGKTVYNMYGIGAYDSNPNYYGAKYAYEQGWFTPEAAIIGGAKFIGSSYIHNTAYNQDTLYKMRWSATATHQYATDIGWAYKQVNRMYSLYSLLDGYTLYFDVPEYRMARKKLKKRKLLISLFFLVSIPLALFVLATTLSKPIEISKETEEIDEQQVFIDSLSGHAQILYEKYHVLPSITIAQAILESDWGNSELAAKANNLFGVKGNYKGHHVTMETDEVEKGKRKTIRAKFRKYSTFFESMDDHAQLFVRGTSWNKKKYKPVLEAGNYKEAATALQTSGYATDPDYADKISAIVEKYDLDEYDEVNPSLKSVDLNASIKDSAVQDVWSKPSTDDRSIRLTSAQSYVGKDIKVVSKKQKGQSVWYQFQINDKLIGWIDDSAVEIKEATMARKLIKNLGKSKSVKRVKLLFKKIFITVFIVASIVAIFNITKYFEELYKVRDLKSTKIEYYMDVADEAGDGKVQLSWKALLAIDMVIHDEDLSNIKKKDTLDIGEKF
IVEDKNDKGEKVYKVKKFNKVLSELKFDSSQKSRARKYMKDLEYTYLGNKQLDSSDEKIKFIKKLEDSAIREYIDYGILPSITIGQAILESGWGNSKLTKQSNNLFGIKADKAWKGKSVEISTSEHYNEKIVASFRSYNSLQDSVKDHSLFLINNKRYRKHGLFEAKDYISQAQALENAGYSTAEDKKGNRIYAELLIDVIRSYNLQLIDNKVETKMFFLTLPLLLGCTAATTPLTAATPPVDPLPLKVVSTDQLPKGLAKDQQLWNKVNGQKGDYKALLTAIDHSLEYLGTDKAQKDYQDYKVPGITRDRVSRSLRRFRQLVVQAKSPQALETAVKKEFQFYQSIGNDQKGNVDFTGYYEATYPASRQPTTEFRYPLYQAPADLKAWPKPHPTRAELEGADGLQASQGPLKGLELVWLRDRIQAFLVQVQGSARLGLTDGTEMTVGYAGKTAHPYTSIGKALIADGKFTLEELSLPVVLQYFEENPQDLDLYIPKNKSFVFFQETFGSPPMGNLNVPVTDERSIATDKSLMPPGALALIQTNLPYYNASQTLEFKDVSRFVLDHDTGSAIKGPGRVDIFMGTGAKAKERAGVMTGSGQLYYLLLKDNMNTPFSIDEVSFRDLPGWGQDDPRKLFPAMATILSHLRNAKPYRTGALGITAAELVSLLELAERGQVNSPEQARQFFETNSVPFRISPAQGKSGFVTAFYEPELEVSATPDDVWRYPIYRRPPELVDIDNDNRPDGFDPSYAFGKADEEGISYFPDRRAIDEGCLRGRGLEIAWARSKVDLFFVHVQGAARLVFPDGAIKRITYAAKAGHVFSPIGRLLLDRGELDPKTISMQTIRQWLADHPDEVDGVLWHNRSYIFFREADVAGLDMGPIAAAKVPLVAGRALAVDRLIHTFGLPFFIHAPTLTHLDDGKPFARLMLALDTGSAIVGPARGDIFTGSGFEAGELAGTVRNEADFYILLPRIAAERYRRMRKIQVAVFLFVGLLAACSTVPPSSAPTTCAQCQPCPACPAVTPAITPAPAPAFSRSLLPASWGDLPGWAEDDVTAAWPAFMQSCRGIASRGNAAGWRRVCELARAADGKPENDVRRFFERHLKPYAIVNGDGLVSGLVTGYYEPMLRGSRTKAKGYEQPVRGVPDDLLTIDLSAVFPELKDKRVRGRLEGNKVVPYWSRAEIAARGDKLPGKTLLYVDDAVELFFLQVQGSGRVKLADGGMVRLNYADQNGYQYQSIGKALVERGELKLEEASMQGIQAWARANPARLESLLNTNPSYVFFREVANSADGPVGALGVPLTAERSIAIDPRSVPLGSPVFLATTRPNSAVPLNRLVMAQDTGGAIKGGVRADFFWGFGKEAGDQAGRMKQSGRMWILLPTELAPKMKGRWVKYLLMGTVVAMLAACSSKPTDRGQQYKDGKFTQPFSLVNQPDAVGAPINAGDFAEQINHIRNSSPRLYGNQSNVYNAVQEWLRAGGDTRNMRQFGIDAWQMEGADNYGNVQFTGYYTPVIQARHTRQGEFQYPIYRMPPKRGRLPSRAEIYAGALSDKYILAYSNSLMDNFIMDVQGSGYIDFGDGSPLNFFSYAGKNGHAYRSIGKVLIDRGEVKKEDMSMQAIRHWGETHSEAEVRELLEQNPSFVFFKPQSFAPVKGASAVPLVGRASVASDRSIIPPGTTLLAEVPLLDNNGKFNGQYELRLMVALDVGGAIKGQHFDIYQGIGPEAGHRAGWYNHYGRVWVLKTAPGAGNVFSGMKKYLFRAALCGIAAAILAACQSKSIQTFPQPDTSVINGPDRPVGIPDPAGTTVGGGGAVYTVVPHLSLPHWAAQDFAKSLQSFRLGCANLKNRQGWQDVCAQAFQTPVHSVQAKQFFERYFTPWQVAGNGSLAGTVTGYYEPVLKGDDRRTAQARFPIYGIPDDFISVPLPAGLRSGKALVRIRQTGKNSGTIDNTGGTHTADLSQFPITARTTAIKGRFEGSRFLPYHTRNQINGGALDGKAPILGYAED
PVELFFMHIQGSGRLKTPSGKYIRIGYADKNEHPYVSIGRYMADKGYLKLGQTSMQGIKAYMQQNPQRLAEVLGQNPSYIFFRELTGSSNDGPVGALGTPLMGEYAGAVDRHYITLGAPLFVATAHPVTRKALNRLIMAQDTGSAIKGAVRVDYFWGYGDEAGELAGKQKTTGYVWQLLPNGMKPEYRPMKFPFHPWRRLLLCALPFAALLTACDDGKKEPPPTPAEVTTYNSVPWDALPATSDADLLAGFNAWRSACARLAKDPVWGEPCASATTVAADPTAVRAFLQERMQVYSLRSSSNGDQGLITGYYEPVYHGSLSQGEKTPVPVYGVPDDLVVVALESVYPELKGKRLRGRLEGRVLKPYDDAATIRDNGSSAPVLAWLGDPMDLQFLQIQGSGRIQLEDGRQLRIGYGDQNGHPYKPVGRWLVEQGLVPKEEISMKRIRDWAEANPQRVSELLASNPSFVFFSLRPDSDEGPRGSLNVPLTDGYSVAIDRKVIPLGSLMWLSTTRPDDGSAVVRPVAAQDTGGAIVGEVRADLFWGTGDAAGELAGHMKQPGRLWLLWPKGAPLPASMGAMNGTSGRRLSTATRVAAMAGVLLLAACGGPSSRPGLVSRPAGVAGPVSYQRVAIEGLPGWSTDRVADALPVFRRSCERLRAVSPNSMVGPSVWGSRASDWQAACAVAARLPAFDDDAARRFFAERFQAWQVTGAGDPTGLFTGYYEAALDGSLSPSAVYSTPIYGVPLDLRMEGGKGMRVSGGRSLPYPDRAAIEEGAISGVAPVIMWARDPVDVFMLHIQGSGQVRLPDGRIQRIGYAANNGHPFVGIGAIMRDRGLGDGSSMIAIRAWLRANPAEGRALMRENPRFIFFRPIEGEGPIGAQGLPLTGGRSLAVDPSSVPLGAPVWLATSDAHGETVNRLMVAQDTGSAIKGAVRGDFFWGSGEEALYHAGGMKSAGRYWVLVPRGGRNAVAQNMKGRWAKYVATGVMLAMLAACSSKPTDRGQQYKDGKFTQPFSLVNQPDAVGAPINAGDFAEQVNQIRSASPRLYTNQSNVYNAVQNWLRSGGDTRTMRQFGIDAWQMEGTDNYGNVQFTGYYTPVVQARHTRQGAFQYPIYSMPPKRGRLPSRAQIYAGALSDKYILAWSNSLMDNFIMDVQGSGYIDFGDGSPLNFFSYAGKNGWPYRSIGKVLIDRGEVKKEDMSMQAIREWGEKHSEAEVRELLEQNPSFVFFKPQSFAPVKGASAVPLIGRASVASDRSIIPPGTTLLAEVPLLDNNGKFSGQYELRLMVALDVGGAIKGQHFDIYQGIGPDAGHRAGWYNHYGRVWVLKSAPGAGNVFSGMFKRRYVTLLPLFVLLAACSSKPKPTETDTTTGTPSGGFLLEPQHNVMQMGGDFANNPNAQQFIDKMVNKHGFDRQQLQEILSQAKRLDSVLRLMDNQAPTTSVKPPSGPNGAWLRYRKKFITPDNVQNGVVFWNQYEDALNRAWQVYGVPPEIIVGIIGVETRWGRVMGKTRILDALATLSFNYPRRAEYFSGELETFLLMARDEQDDPLNLKGSFAGAMGYGQFMPSSYKQYAVDFSGDGHINLWDPVDAIGSVANYFKAHGWVKGDQVAVMANGQAPGLPNGFKTKYSISQLAAAGLTPQQPLGNHQQASLLRLDVGTGYQYWYGLPNFYTITRYNHSTHYAMAVWQLGQAVALARVQMFALTAYRLRCAAWLLATGIFLLLAGCSEAKAPTALERVQKEGVLRVITRNSPATYFQDRNGETGFEYELAKRFAERLGVELKIETADNLDDLYAQLSREGGPALAAAGLTPGREDDASVRYSHTYLDVTPQIIYRNGQQRPTRPEDLVGKRIMVLKGSSHAEQLAELKKQYPELKYEESDAVEVVDLLRMVDVGDIDLTLVDSNELAMNQVYFPNVRVAFDFGEARGLAWALPGGDDDSLMNEVNAFLDQAKKEGLLQRLKDRYYGHVDVLGYVGAYTFAQHLQQRLPRYESHFKQSGKQL
DTDWRLLAAIGYQESLWQPGATSKTGVRGLMMLTNRTAQAMGVSNRLDPKQSIQGGSKYFVQIRSELPESIKEPDRSWFALAAYNIGGAHLEDARKMAEKEGLNPNKWLDVKKMLPRLAQKQWYAKTRYGYARGGETVHFVQNVRRYYDILTWVTQPQMEGSQIAESGLHLPGVNKTRPEEDSGDEKLMIGADTAKECDAMTFKLLPLAVLCAALVGCQSAQSRDARAESPATAESAAPTAEAPVSEAQEADFETWLANFRRQARGEGIDEATLARALDGLRYRPRVIELDGSQPEFVRPIWEYLDSAVSASRVKKGRERLAEYRDTVRQMTERYGVPGEVLVAIWGIESSYGDYLGDFSTLEALATLAYDGRRRDFARGELLAALRIIEAGDISPERMKGSWAGAMGHTQFIPSSFLAHAVDGDGDGRRDIWNSIADVLASTANYLDEAGWREGEPWGTEVSLPQGFDYTLTEPDIRRSSAEWAAAGVRSRDGHALPDFASASVIAPAGAQGPVFLVGHNFRVILRYNNATSYALAVATLSDAIAGRAGIQGEWPREQPALKRSEVREMQQLLDARGFDVGTPDGILGPNTRRGLRAFQREIGVTPDGFATKALLERLRRMPGLPRARMAQWHPLYSVRLAKDTMTDTQRSLRRPLLGAALSAAALGLCGLSPSLLAAGKRRVSLREEEIEPGRYRDNPQARAFIDEMVARHGFDRGMLQDWFGQAVYSATVVRLIMPPATTGRKSWRTYRSRFIEPIRINAGVRFWQDNRDTLRRAEAEFGVPASVIVGIIGVETIYGRDMGSFRVLDSLSTLAFDYPATPNREARSTLFRNQLADYLLWCRDTRTDVYSVLGSYAGAIGIPQFMPTSLREYALDYDNNGHIDLRNSPTDAIGSVARFLQLHGWEPGRPVVWRIAPDDGSLGVATAAADGEPWPTRTLNQLTRAGLRVDEPINLAREGETGVLVVDLPTPDQPTEYLLGLRNFYVLTRYNRSFFYALAVYQLGEAVKAAMGMFGILNRREMLRGTAATLLLPGILTSAHAGQVAEDPLLRYPWLAQWAGADGLDAPWLRGVFQNLKKYPRVIRAMNHQAEAKPFYLYREHVTSPWLYKKGREAWQQHRAMLEAAGARYGVDAPFVLALWGMESRFGRNQGEHPVLRTLFTLAVDYPRRQTFFRQELRHFLILCRQQGWDPMLLKGSYAGAMGHVQMIPSSLRYYAVDGDGDGRLDVFNNPMDATASIAHYLGKHGWELGGPYLIPVYGITDLSAIKSAKVKEMQPWSSWYALGVRTRGEPPPAERAMALIALEEQDGLRYYGVFNNFRVILDWNRSTRFAKVVGELAEGFVLMPTPATRASLIGLALASGLLAGPARADFQSCLAGIQAQAAGAGVSAQTFRAATANIAYDDKVIELSQAQPEFKTPIWDYMSALVDEERVEDGRAAMRQHAQALANAEARYGVDRHTIAAVWGVESNFGKNLGKMPLVQSLATLACSSNRRRDFFRSELIATLKIIERGDIEASRLTGSWAGAFGQTQFMPTTYQRLAVDGDGDGRRDVVDSVADAVASTANFLRVAKWSNGQPWGYEVRLPRGFNVAAAGRKNKHAVGHWASLGVTRVDGKALTGDGPAGIIAPAGINGPAFLVTKNFDAIYSYNAAESYGLAIAVLSDRLRGRPGVQADWPTDDPPLSRAERRDLQTRLTARGYDVGEPDGKVGSKTREAIKEIERQLGMPATGRPGGKVLEALRRGMFKYSFIAVIVSTVLLSACADSHQKSAEKKPVTSEIANIATSAPARWKQIDVVSLEQAFPKQSRTPAQFPAYVDALKQKAAELGYKPETINFAFSEIHFIDRVVKSDRNQPEKKITLDVYLPRVVTKGRIAEGAKLYQANQQTLAQISNQYGVPANYIVALWGLESGFGRVQGKEDVISALATLAFEGRREALFSRQLMAALEIIENGHLPVGQRLKGSWAGAMGQTQFMPSSFLTYAADGNGDGNIDIWNSREDAFA
SAANYLATEGWQRDLPWGEQVSLPANFNQQLEGIKTEQQKTVAQWKALGVQLPANSQLSDDMKVWLIIPDDDLHRSYLVTQNFRTIMHWNSSYFFALSIVTMADGVANKINTLPTQHMKKESRPAFDAAAVFDAAAVPVSDSGFAANANVRRFVDDEVGKGDFSRAEWQDFFDKAAYKADIVKIMHRPSTSRPWYVFRTGNSGKAKFRGARRFYAENRALIDDVAQKYGVPAELIVAVIGIETNYGKNTGSFRVADALATLGFDYPRRAGFFQKELVELLKLAKEEGGDVFAFKGSYAGAMGMPQFMPSSYRKWAVDYDGDGHRDIWGNIGDVAASVANYMKQHGWRTGGKILVSATLAPGADVQAIIGEKTALTRTVADLKAYGIIPGEELADDEKAVLFKLETAPGVFEYYLGLNNFYTVWQYNHSRMYVTAVRDIANSLGGSGLMASSSSSKQAKPIHRMAWRLGVSLTLLLGLGALFVLPKFDPKSLTWPTTEPGRIAPLAMSGGNPYLRALMRTISASESNDASPYTVLYGGSHIENLQEHPDRCIPIRWGPNQGLCTTAAGRYQFITTTWLETAEKYHPAPTGEWMWRRYSFAPEYQDRVVYAWLDDVNYWGTDIPQLLEDGQLQTVLKRLSGTWTSLGYGIESNKVTPHLMHIYERMLAEEIALANGLPTNYLPTVANQSVETTRMIIQHSQPKRKGTKYRLKKPYKLVFNLIIVVGLIGLVYSFKKNTQPLVNPSLVTHLPELEMSGGDPYIRALMLTISASESNHKNSYYLLYGGSHVHNLQQHPDQCIPINIGPNRGNCSTAAGRYQFLNSTWQEKARKYHPNPQKNYRQYIYSFEPKYQDIVVYRWLKDHHQWNVDLLTLLKQDQVEEVLRKLSNVWTSLGGGIEDNSMTPHLPSIYRYFLAQELNRENADQNSLMVEINNQRKAFLDMLAWSEGTDNGRQKTRNHGYDVIVGGELFTDYSDHPRKLVTLNPKLKSTAAGRYQLLSRWWDAYRKQLGLKDFSPKSQDAVALQQIKERGALPMIDRGDIRQAIDRCSNIWASLPGAGYGQFEHKADSLIVKFKEAGGTVREIEVMGYTWKGLAKQYGFTDFSPATQDKAAVALILAKKGAMEAILNGDYEQAVMKLGGIWASFPTAPNEYRQHKRSWGFVHNFFRQRGFMARISAADAGGVNVIAFLDMLAWSEGTSTIKASDYGYDVLVGGKLFSEYSKHPRVKVWLPKYSIYSSAAGRYQFLAGTWDAIVKNYGFKGRFIPEAQDLAAIKLLTECGALPLIKAGRIVEAIAKAAPIWASLPGAGYGQREHKLAALLGIYEAERAAEAKPQDQLLAMFSACGGEMAAMTRYEFALLALAAVGYVVWRDWQRSEEPGAQSPDFIDQAENLFYDATEGNFFGGTEDTDMGQAQLNRAAFLLTIRTGEGTAGNDGYRMLFGGGKFDSFADHPRQVVTALSNGKPISSSAAGAYQFLRRTWDTLAARLGLTDFSPASQDAAALELIREAGALGDVDAGRFALAVRKVRKIWASMPGAGYGQPEVALERLQAAYQAAGGVVNGMPVINTHQNIAAFLDMLAYSEGTANHPLTKNRGYDVIVTSLDGRPEIFTDYSDHPFAHGRPAKVFNRRGEKSTASGRYQQLYMFWPHYKKQLALPDFSPLSQDKLAIQLIRERGAIDDIRAGRIERAVSRCRNIWASLPGAGYGQREHSLEKLVTVWRTAGGVVAMYSQQVQQINQPQKNSDIQLINMWLQQIHPIQQNSHLYIAQMFLKFIKKPLKKVTSADVIAFANVYGVRSHNSHSNQQKRIETINSLLKFGQEAGILPRNQKKTFSPNTTNFKTSVYSQNKIKNYRTTGKQQKKPLNWSQLFNLQLASSVLIVFILLMAILQLFRQVSGSTNANQNKSVTSVVMPKIDPTKNWAYPVNVPRIRAFLDTIAVTEGTTGPKGYYRQYTGSHFLSFEDHPRELKCANSNGKKLCSDAAGRYQFLSTSWDRFAPVVKAQN
FSPTYQDRVAIELIRDKNALKDIEEGRVKEAFQKLYMVWPSFGETETDVEQLMPKLVGTYEQKLALYQIKNMDDEFERAFKKILDYEGGYSDEQKDHGGKTKYGITEKLARDYGHEGEMKDLELEKAKEIYYREFWANHLYSWIEDERIATEVFEQAVNMGAKTANKHLQKAYNLLADKEIAVDGIIGQRTLEAVNNFEHNSDLFKLLNILQAKKYINIVKNDASQQKFIRGWLRRVELDIDSRKSMKRNFQTVMPYIFSEEGGYADNPADPGGATNMGITINTLSAWEGRQVSPQDVKELTQATATQIYQVEFWNKIDGNDLPSGVDYALFDFAVNSGPGRAAKTLQKILAMPEDGIIGAQTVAAAAARSPEGIINALCDARAAWLRGLSTAATFGNGWLARVERVRARALALAATPPAITQPADPAGNPSPKARQADIAFTSALKHPEALGTMGSVASGLAAIATGNGPVQYALAIVMVACAGVGLWYFVRRVRSEPMNFDQAFDRLLGHEGGYSNNSADPGGETMWGVTARVARADGYLGEMRDLPRDRAKSIYRRLYWTPVRADELPEVVRFDVFDGAVNSGPAQSIKWLQRAAGAVDDGILGPRTMAAAVAAGPVLAARYNGHRLLFLADRPTWGSFGKGWARRVGKNLLGAMDQPPWLQAAWAEFGVREIPGKEDAPEILRYFRDAGDTNVETEATPWCAAFLGAMLKRAGYAGTGSLLARSYLDWGDRLDDARFGAVAVLSRGDDPNAGHVGFLLSDTNGKLYLLGGNQGDAVTVASFDKARLLGLRWPKENVEAASKGDDAIFSRVLAHVLEMEGGFSNDPYDPGGPTNRGITLEVYAKFRKETLDDGTRARLIAELKRIPDAIVTAIYRQRYFDPASCPVFTAPLALMHFDAAVNHGVGAAIRMLQGVAGVTVDGEIGPETLAAIGAKSLADLLDDYAETRRARYRALPHFWRFGRGWLKRVDATLALARTWAAAEATNRGLIEPQQIAKGEGKMGEKSKTEISSSDDSKWWLNSKTMWGTLITAAATVIPVLGPAVGIVLPADLITSFGDQVVTAAQALAGLFGTALAIYGRLKADTPLVLRKNMSAPLTFQQVFDRVVGHEGGYVNDPHDPGGETNWGITKYTARENGYTGSMKAMTREQAYKIYEKAFWQRYHCEKLPEAVAFQFFDAAVNHGVGNASRMLQRAVNVADDGIIGKVTLSAVEKMPISDLLLRFNAERIRFYTKLKNFPRYGKGWMNRIAGNLAYAAIDNEVMNPIIDGIIALEGGYVFNPKDKGGATHWGITEATARAHGYAGDMRDLTHAEAYAILEEDYWIKPGFDVISTLSWPVSFELCDAAVNIGAYHPSAWLQRWLNVFNHEGKRYPDIHVDGNIGPRTLAALEHYLAWRGQEGEAVLVKALNCSQGTYYLNVAEKNHNNEQFIYGWIKNRVTMDSFEDAFKALIGNEGGYSFNPADPGGETMWGVTARVARSEGYNGAMKDLPLETAHQIAKRRYWDPLHLDELDPRVAFQIFDANYNGGLVVLWMQKASGAKEDGKFGPDTLDAVKNADPMKFVMRFAAYRLRYLRNLHSWPSFSRGWTERMAANLLLGAAMSQTATLSDFNKAFDRVIQHEGGYVNDPRDAGGETKFGITIHTARANGYTGSMFTMTRDDAKQIYLKAFWQRYRCNEFPPELAFQFFDACVNHGSGNASRMLQRAVGVVDDGIIGEITLAAIRKRSTVEVVTLFNAERLEFYTKLSGFQHFGKGWIRRMAGNLRHIADDVGDK',
'target_names': [18, 19, 22, 23, 24, 25, 73, 102, 103, 104, 108],
'targets': array([ 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 2,
2, 2, 2, 2, 2, 2, 2, 3, 3, 3, 3, 3, 3, 3, 3, 4, 4,
4, 4, 4, 4, 4, 4, 5, 5, 5, 5, 5, 5, 5, 5, 6, 6, 6,
6, 6, 6, 6, 6, 7, 7, 7, 7, 7, 7, 7, 7, 8, 8, 8, 8,
8, 8, 8, 8, 9, 9, 9, 9, 9, 9, 9, 9, 10, 10, 10, 10, 10,
10, 10, 10])}
In [ ]:
# Turn the loaded sequences into vectors for the steps below.
# NOTE(review): chunksize=5 presumably sets the chunk length in letters — confirm
# against bio.sequences_to_vectors.
data = bio.sequences_to_vectors(
    sequence_data,
    chunksize=5,
)
In [ ]:
# Summarize the vectorized dataset assigned to `data` in the preceding cell.
# NOTE(review): summary() presumably comes from the `from classy import *` star-import — confirm.
summary(data)
Here's a little sanity check: convert the first few vectors back into sequences and compare them with the original sequence.
In [ ]:
# Sanity check: print the first original sequence, then the first ten vectors
# converted back to text, so the two can be compared by eye.
print("original sequence:")
print("\t", sequence_data.data[0])
print("the first few chunks:")
for vector in data.vectors[:10]:
    # The loop body must be indented under the `for`; at column 0 it is an
    # IndentationError.
    # NOTE(review): data.letters is presumably the alphabet used when the
    # vectors were built — confirm against bio.vector_to_sequence.
    print("\t", bio.vector_to_sequence(vector, data.letters))
You only need to save to CSV if you want to look at the vectors in Excel; usually this step is unnecessary.
In [ ]:
# Optional export of the vectorized dataset to a CSV file.
# The filename has no directory component, unlike the 'data/...' inputs loaded elsewhere.
save_csv(
    'small sequence dataset.csv',
    data,
)
In [ ]:
# Load two separate workbooks: one used as the training set, one as the test set.
sequence_data_train = bio.load_sequences('data/small sequence dataset.xlsx')
sequence_data_test = bio.load_sequences('data/another small sequence dataset.xlsx')
In [ ]:
# Vectorize the training and test sequences in a single call, which returns one
# result per input dataset.
# NOTE(review): converting both together presumably keeps the letter encoding
# consistent between the two sets — confirm against bio.sequences_to_vectors.
data_train, data_test = bio.sequences_to_vectors(
    sequence_data_train,
    sequence_data_test,
    chunksize=5,
)
Content source: bblais/Classy
Similar notebooks: